{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 181013060 黄嘉慧"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 对猎聘PC版进行数据爬取"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "- [猎聘](https://www.liepin.com/zhaopin/)以“人力资源”关键词为例。\n",
    "- 对公司、行业、城市三个不同的参数进行数据（文本、链接）的抓取。\n",
    "- 解析url参数，并建构参数模版。\n",
    "- 创建payload（翻页）模版，\n",
    "- xpath解析页面数据，\n",
    "- 翻页（可参考之前翻页参数模版）"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[<Element 'div' class=('search-conditions',) data-selector='search-conditions'>]\n",
      "<Element 'div' class=('search-conditions',) data-selector='search-conditions'>\n",
      "[<Element 'dt' class=('search-title',)>, <Element 'dt' class=('search-title',)>, <Element 'dt' class=('search-title',)>, <Element 'dt' class=('search-title',)>, <Element 'dt' class=('search-title',)>]\n",
      "公司：\n",
      "行业：\n",
      "城市：\n",
      "薪资：\n",
      "更多：\n",
      "<Element 'dd' class=('comp-list',)>\n",
      "<Element 'dd' class=('short-dd', 'select-industry') data-param='industries'>\n",
      "<Element 'dd' data-param='city'>\n",
      "<Element 'dd' data-param='salary'>\n",
      "<Element 'dd' class=('dropdown', 'dropdown-time')>\n",
      "<Element 'dd' class=('dropdown', 'dropdown-jobkind')>\n",
      "<Element 'dd' class=('dropdown', 'dropdown-compscale')>\n",
      "<Element 'dd' class=('dropdown', 'dropdown-compkind')>\n"
     ]
    }
   ],
   "source": [
    "# 对网页分类栏的文本类型抓取\n",
    "import pandas as pd\n",
    "from requests_html import HTMLSession\n",
    "\n",
    "url = \"https://www.liepin.com/zhaopin/?keyword=人力资源\"\n",
    "session = HTMLSession()\n",
    "r = session.get(url)\n",
    "\n",
    "# Narrow the page down to the search-conditions block; every query below is scoped to it.\n",
    "主要元素 = r.html.xpath('//div[@data-selector=\"search-conditions\"]')\n",
    "search_panel = 主要元素[0]\n",
    "print(主要元素)\n",
    "print(search_panel)\n",
    "\n",
    "# <dt> headings of the filter rows: show the raw elements first, then their text.\n",
    "list_search_title = search_panel.xpath('//dt[@class=\"search-title\"]')\n",
    "print(list_search_title)\n",
    "for x in list_search_title:\n",
    "    print(x.text)\n",
    "\n",
    "# <dd> siblings that follow the headings, printed as raw elements.\n",
    "list_search_dd = search_panel.xpath('//dt[@class=\"search-title\"]/following-sibling::dd')\n",
    "for x in list_search_dd:\n",
    "    print(x)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'中国500强': '/zhaopin/?init=-1&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&compTag=155&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '2018互联网300强': '/zhaopin/?init=-1&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&compTag=182&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '制造业500强': '/zhaopin/?init=-1&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&compTag=186&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " 'AI创新成长50强 ': '/zhaopin/?init=-1&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&compTag=189&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '独角兽': '/zhaopin/?init=-1&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&compTag=130&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '上市公司': '/zhaopin/?init=-1&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&compTag=156&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4'}"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Scrape the hot-company filter tags: map each tag's label to its link (href).\n",
    "# Chain: search-conditions block -> first <dd> after the titles -> links inside hot-comp-tags.\n",
    "公司标签元素 = r.html.xpath('//div[@data-selector=\"search-conditions\"]')[0] \\\n",
    "                .xpath('//dt[@class=\"search-title\"]/following-sibling::dd')[0] \\\n",
    "                .xpath('//div[contains(@class,\"hot-comp-tags\")]/a')\n",
    "\n",
    "# The element list keeps its own name, so 公司数据选择器链结 only ever holds the\n",
    "# label -> href dict. Only the last expression of a cell is displayed, hence no\n",
    "# bare expression in the middle of the cell.\n",
    "公司数据选择器链结 = {x.xpath(\"a/text()\")[0]: x.xpath(\"a/@href\")[0] for x in 公司标签元素}\n",
    "公司数据选择器链结"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### urllib模块功能介绍"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "- urlparse 返回 6 个部分，分别是：scheme(机制)、netloc(网络位置)、path(路径)、params(路径段参数)、query(查询)、fragment(片段)。\n",
    "- parse_qs 把 query(查询) 字符串解析成字典：键是参数名，值是该参数的取值列表。"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'pandas.core.frame.DataFrame'>\n",
      "RangeIndex: 6 entries, 0 to 5\n",
      "Data columns (total 6 columns):\n",
      "scheme      6 non-null object\n",
      "netloc      6 non-null object\n",
      "path        6 non-null object\n",
      "params      6 non-null object\n",
      "query       6 non-null object\n",
      "fragment    6 non-null object\n",
      "dtypes: object(6)\n",
      "memory usage: 368.0+ bytes\n",
      "scheme      1\n",
      "netloc      1\n",
      "path        1\n",
      "params      1\n",
      "query       6\n",
      "fragment    1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>scheme</th>\n",
       "      <th>netloc</th>\n",
       "      <th>path</th>\n",
       "      <th>params</th>\n",
       "      <th>query</th>\n",
       "      <th>fragment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=8048cb4ce04891b3&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=8048cb4ce04891b3&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=8048cb4ce04891b3&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=8048cb4ce04891b3&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=8048cb4ce04891b3&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  scheme netloc       path params  \\\n",
       "0                /zhaopin/          \n",
       "1                /zhaopin/          \n",
       "2                /zhaopin/          \n",
       "3                /zhaopin/          \n",
       "4                /zhaopin/          \n",
       "\n",
       "                                               query fragment  \n",
       "0  init=-1&headckid=8048cb4ce04891b3&flushckid=1&...           \n",
       "1  init=-1&headckid=8048cb4ce04891b3&flushckid=1&...           \n",
       "2  init=-1&headckid=8048cb4ce04891b3&flushckid=1&...           \n",
       "3  init=-1&headckid=8048cb4ce04891b3&flushckid=1&...           \n",
       "4  init=-1&headckid=8048cb4ce04891b3&flushckid=1&...           "
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 对于公司标签爬取出来的url，使用 urllib.parse 解析 url\n",
    "\n",
    "from urllib.parse import urlparse, parse_qs # 详细看上面urllib模块的介绍。\n",
    "# Split every company-tag link into its URL components, one row per link.\n",
    "parsed_links = []\n",
    "for link in 公司数据选择器链结.values():\n",
    "    parsed_links.append(urlparse(link))\n",
    "df = pd.DataFrame(parsed_links)\n",
    "\n",
    "df.info()\n",
    "# nunique() counts the distinct values per column, i.e. which URL components actually vary.\n",
    "print(df.nunique())\n",
    "df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "ckid             1\n",
      "compTag          6\n",
      "d_ckId           1\n",
      "d_curPage        1\n",
      "d_headId         1\n",
      "d_pageSize       1\n",
      "d_sfrom          1\n",
      "flushckid        1\n",
      "fromSearchBtn    1\n",
      "headckid         1\n",
      "init             1\n",
      "keyword          1\n",
      "siTag            1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>ckid</th>\n",
       "      <th>compTag</th>\n",
       "      <th>d_ckId</th>\n",
       "      <th>d_curPage</th>\n",
       "      <th>d_headId</th>\n",
       "      <th>d_pageSize</th>\n",
       "      <th>d_sfrom</th>\n",
       "      <th>flushckid</th>\n",
       "      <th>fromSearchBtn</th>\n",
       "      <th>headckid</th>\n",
       "      <th>init</th>\n",
       "      <th>keyword</th>\n",
       "      <th>siTag</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>155</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>182</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>186</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>189</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>130</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "               ckid compTag                            d_ckId d_curPage  \\\n",
       "0  8048cb4ce04891b3     155  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "1  8048cb4ce04891b3     182  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "2  8048cb4ce04891b3     186  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "3  8048cb4ce04891b3     189  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "4  8048cb4ce04891b3     130  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "\n",
       "                           d_headId d_pageSize         d_sfrom flushckid  \\\n",
       "0  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "1  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "2  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "3  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "4  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "\n",
       "  fromSearchBtn          headckid init keyword  \\\n",
       "0             2  8048cb4ce04891b3   -1    人力资源   \n",
       "1             2  8048cb4ce04891b3   -1    人力资源   \n",
       "2             2  8048cb4ce04891b3   -1    人力资源   \n",
       "3             2  8048cb4ce04891b3   -1    人力资源   \n",
       "4             2  8048cb4ce04891b3   -1    人力资源   \n",
       "\n",
       "                                           siTag  \n",
       "0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "1  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "2  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "3  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "4  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  "
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# The parsed URLs differ only in their query component, so break the query strings down too.\n",
    "# parse_qs maps each key to a list of values; only the first value of each list is kept.\n",
    "query_rows = []\n",
    "for query in df['query']:\n",
    "    row = {}\n",
    "    for key, values in parse_qs(query).items():\n",
    "        row[key] = values[0]\n",
    "    query_rows.append(row)\n",
    "df_qs = pd.DataFrame(query_rows)\n",
    "\n",
    "print(df_qs.nunique())\n",
    "df_qs.head()\n",
    "# To look at selected columns only: df_qs[['keyword','compTag']]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "- compTag 是公司类型的选择器参数：不同的数值对应不同类型的公司\n",
    "- keyword 是搜查关键字"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'init': ['-1'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'keyword': ['人力资源'], 'compTag': ['155'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}\n",
      "{'中国500强': '155', '2018互联网300强': '182', '制造业500强': '186', 'AI创新成长50强 ': '189', '独角兽': '130', '上市公司': '156'}\n"
     ]
    }
   ],
   "source": [
    "# Parameter template and label -> compTag lookup for the company filter.\n",
    "def parse_url_qs_for_compTag(url):\n",
    "    \"\"\"Return the query string of ``url`` parsed into a dict.\n",
    "\n",
    "    The result comes straight from ``urllib.parse.parse_qs``: each key maps to\n",
    "    the list of values given for that key in the query string.\n",
    "    \"\"\"\n",
    "    return parse_qs(urlparse(url).query)\n",
    "\n",
    "# 1. Parse the first company link; its full parameter dict serves as the template.\n",
    "参数模板 = parse_url_qs_for_compTag(list(公司数据选择器链结.values())[0])\n",
    "print(参数模板)\n",
    "\n",
    "# 2. Map every company label to its compTag value. parse_qs yields a list per key,\n",
    "#    so [0] takes the single value out of it. (The former stand-alone list\n",
    "#    comprehension was dropped: its result was neither stored nor displayed.)\n",
    "字典_compTag = {k: parse_url_qs_for_compTag(v)['compTag'][0] for k, v in 公司数据选择器链结.items()}\n",
    "print(字典_compTag)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'中国500强': {'init': ['-1'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'keyword': ['用户体验'], 'compTag': ['155'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '2018互联网300强': {'init': ['-1'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'keyword': ['用户体验'], 'compTag': ['182'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '制造业500强': {'init': ['-1'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'keyword': ['用户体验'], 'compTag': ['186'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, 'AI创新成长50强 ': {'init': ['-1'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'keyword': ['用户体验'], 'compTag': ['189'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '独角兽': {'init': ['-1'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'keyword': ['用户体验'], 'compTag': ['130'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': 
['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '上市公司': {'init': ['-1'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'keyword': ['用户体验'], 'compTag': ['156'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}}\n"
     ]
    }
   ],
   "source": [
    "# Build request parameters for the company filter from the template.\n",
    "def 参数模板生成(compTag, keyword):\n",
    "    \"\"\"Return a copy of the global 参数模板 with 'compTag' and 'keyword' replaced.\n",
    "\n",
    "    The template itself is left unmodified; its other entries are carried over.\n",
    "    \"\"\"\n",
    "    return {**参数模板, 'compTag': compTag, 'keyword': keyword}\n",
    "\n",
    "# One parameter set per company label, all using the keyword '用户体验'.\n",
    "# Both values are passed wrapped in a list.\n",
    "参数_compTag_用户体验 = {}\n",
    "for label, tag in 字典_compTag.items():\n",
    "    参数_compTag_用户体验[label] = 参数模板生成(compTag=[tag], keyword=['用户体验'])\n",
    "print(参数_compTag_用户体验)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Shared HTTP session that requests_liepin sends its requests through.\n",
    "session = HTMLSession()\n",
    "\n",
    "def requests_liepin(url, params):\n",
    "    \"\"\"Request one liepin result page and return its job list as a DataFrame.\n",
    "\n",
    "    Parameters\n",
    "    ----------\n",
    "    url\n",
    "        Address of the page to request.\n",
    "    params\n",
    "        Query parameters, forwarded to ``session.get``.\n",
    "\n",
    "    Returns\n",
    "    -------\n",
    "    pandas.DataFrame\n",
    "        One row per ``<li>`` found under ``ul.sojob-list`` and one column per\n",
    "        inner key of ``dict_xpaths``.\n",
    "    \"\"\"\n",
    "    # Use the caller's ``params``. This line used to pass a global named ``payload``,\n",
    "    # so the argument was ignored and the call raised NameError unless such a\n",
    "    # global happened to exist.\n",
    "    r = session.get(url, params=params)\n",
    "\n",
    "    # Select the job <li> items first; every XPath below is evaluated per item.\n",
    "    主要元素 = r.html.xpath('//ul[@class=\"sojob-list\"]/li')\n",
    "\n",
    "    # XPaths grouped by extraction mode; the inner keys become the column names.\n",
    "    dict_xpaths = {\n",
    "        'text': {\n",
    "            'edu': '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]',\n",
    "            '经验': '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]/following-sibling::span',\n",
    "            '薪水': '//div[contains(@class,\"job-info\")]/p/span[@class=\"text-warning\"]',\n",
    "            '时间': '//div[contains(@class,\"job-info\")]/p/time/@title',\n",
    "            '职称': '//div[contains(@class,\"job-info\")]/h3/a',\n",
    "            '行业': '//div[contains(@class,\"job-info\")]/p/a',\n",
    "            '公司名称': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a',\n",
    "        },\n",
    "        'text_content': {\n",
    "        },\n",
    "        'href': {\n",
    "            '链结': '//div[contains(@class,\"job-info\")]/h3/a',\n",
    "            '公司URL': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a',\n",
    "        },\n",
    "    }\n",
    "\n",
    "    def get_e_text_content(_xpath_):\n",
    "        \"\"\"Full text content of the first match of ``_xpath_`` in every item.\"\"\"\n",
    "        return [e.xpath(_xpath_)[0].lxml.text_content() for e in 主要元素]\n",
    "\n",
    "    def get_e_text(_xpath_):\n",
    "        \"\"\"Stripped text of all matches of ``_xpath_``, concatenated per item.\n",
    "\n",
    "        A match is either a plain string (e.g. an attribute value) or an element,\n",
    "        in which case its ``.text`` is used.\n",
    "        \"\"\"\n",
    "        return [\n",
    "            \"\".join(x.strip() if isinstance(x, str) else x.text.strip() for x in e.xpath(_xpath_))\n",
    "            for e in 主要元素\n",
    "        ]\n",
    "\n",
    "    def get_e_href(_xpath_):\n",
    "        \"\"\"One absolute link of the first match of ``_xpath_`` per item, else an empty string.\"\"\"\n",
    "        结果 = []\n",
    "        for e in 主要元素:\n",
    "            # Query once per item. A missing node is treated like a node without\n",
    "            # links, so the column still gets exactly one entry for this item.\n",
    "            节点 = e.xpath(_xpath_, first=True)\n",
    "            链接 = list(节点.absolute_links) if 节点 is not None else []\n",
    "            结果.append(链接[0] if 链接 else \"\")\n",
    "        return 结果\n",
    "\n",
    "    # Resulting column order: text_content entries, then text, then href.\n",
    "    数据字典 = {k: get_e_text_content(v) for k, v in dict_xpaths['text_content'].items()}\n",
    "    数据字典.update({k: get_e_text(v) for k, v in dict_xpaths['text'].items()})\n",
    "    数据字典.update({k: get_e_href(v) for k, v in dict_xpaths['href'].items()})\n",
    "\n",
    "    return pd.DataFrame(数据字典)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>edu</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>时间</th>\n",
       "      <th>职称</th>\n",
       "      <th>行业</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>链结</th>\n",
       "      <th>公司URL</th>\n",
       "      <th>热门公司类型</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20-30k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>建筑结构工程师</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>天音控股</td>\n",
       "      <td>https://www.liepin.com/job/1926991259.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7954048/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月25日</td>\n",
       "      <td>频道运维岗</td>\n",
       "      <td>济南-高新区</td>\n",
       "      <td>中国重型汽车集团有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927756245.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9739005/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月25日</td>\n",
       "      <td>播音主持岗</td>\n",
       "      <td>济南-高新区</td>\n",
       "      <td>中国重型汽车集团有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927756189.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9739005/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月25日</td>\n",
       "      <td>后期制作岗</td>\n",
       "      <td>济南-高新区</td>\n",
       "      <td>中国重型汽车集团有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927756135.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9739005/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月25日</td>\n",
       "      <td>摄像记者岗</td>\n",
       "      <td>济南-高新区</td>\n",
       "      <td>中国重型汽车集团有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927755771.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9739005/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月25日</td>\n",
       "      <td>律师</td>\n",
       "      <td>大连-金州区</td>\n",
       "      <td>天瑞集团</td>\n",
       "      <td>https://www.liepin.com/job/1927721247.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8946384/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>学历不限</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月24日</td>\n",
       "      <td>律师（青海）</td>\n",
       "      <td>海东</td>\n",
       "      <td>天瑞集团</td>\n",
       "      <td>https://www.liepin.com/job/1927721427.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8946384/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>安装成本高级经理</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>禹洲地产股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927695079.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2245242/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>25-35k·16薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>集团总部-云架构管理岗</td>\n",
       "      <td>广州</td>\n",
       "      <td>越秀集团</td>\n",
       "      <td>https://www.liepin.com/job/1927682669.shtml</td>\n",
       "      <td>https://www.liepin.com/company/4585715/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>工程管理总监/经理</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>禹洲地产股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927104937.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2245242/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>6-7k·13薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>人力资源专员（中关村）</td>\n",
       "      <td></td>\n",
       "      <td>中国国际技术智力合作有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927674527.shtml</td>\n",
       "      <td>https://www.liepin.com/company/1233751/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>11-25k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>游戏测试工程师</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927537007.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>创意营销策划</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927536945.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-25k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>品牌营销经理</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927536797.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>公关传播策划</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927536611.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>15-25k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>税务管理经理</td>\n",
       "      <td>北京</td>\n",
       "      <td>天狮集团</td>\n",
       "      <td>https://www.liepin.com/job/1927052483.shtml</td>\n",
       "      <td>https://www.liepin.com/company/571564/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月15日</td>\n",
       "      <td>数字版权管理运营</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927471953.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>30-50k·12薪</td>\n",
       "      <td>2020年04月13日</td>\n",
       "      <td>集团总部投资总监</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>禹洲地产股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927409715.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2245242/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-25k·13薪</td>\n",
       "      <td>2020年04月13日</td>\n",
       "      <td>高级运维开发工程师</td>\n",
       "      <td>杭州</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1926674043.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月10日</td>\n",
       "      <td>集团总部招采总监</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>禹洲地产股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927352801.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2245242/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月07日</td>\n",
       "      <td>营销副总经理</td>\n",
       "      <td>张家口</td>\n",
       "      <td>荣盛房地产发展股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927259977.shtml</td>\n",
       "      <td>https://www.liepin.com/company/548548/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>30-50k·12薪</td>\n",
       "      <td>2020年03月31日</td>\n",
       "      <td>运营总监/经理</td>\n",
       "      <td>深圳-西丽</td>\n",
       "      <td>禹洲地产股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927104335.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2245242/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20-35k·16薪</td>\n",
       "      <td>2020年03月29日</td>\n",
       "      <td>资深NLP算法工程师/专家</td>\n",
       "      <td>杭州-滨江区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927053241.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>长春</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772101.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>石家庄</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772093.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>廊坊</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772089.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>上海</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772081.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>北京</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772075.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>深圳</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772071.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>学历不限</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>知识图谱部_产品研发资深工程师</td>\n",
       "      <td>北京</td>\n",
       "      <td>Baidu</td>\n",
       "      <td>https://www.liepin.com/job/1927772031.shtml</td>\n",
       "      <td>https://www.liepin.com/company/884492/</td>\n",
       "      <td>中国500强</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·13薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>前端开发人员</td>\n",
       "      <td>天津-大王古庄</td>\n",
       "      <td>大禹节水</td>\n",
       "      <td>https://www.liepin.com/job/1927684493.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9135243/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>5-7k·12薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>测试技术员（惠州）</td>\n",
       "      <td>惠州</td>\n",
       "      <td>深圳市豪鹏科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927684487.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7938237/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>中专/中技及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>6-9k·12薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>生产班长（惠州）</td>\n",
       "      <td>惠州</td>\n",
       "      <td>深圳市豪鹏科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927684115.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7938237/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>9-14k·15薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>PQM高级工程师（惠州）</td>\n",
       "      <td>惠州</td>\n",
       "      <td>深圳市豪鹏科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927683679.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7938237/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20-30k·13薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>运营经理（天猫品牌店）</td>\n",
       "      <td>广州</td>\n",
       "      <td>奥飞</td>\n",
       "      <td>https://www.liepin.com/job/1927613401.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7875551/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-15k·13薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>运营经理/主管（天猫店铺运营）</td>\n",
       "      <td>广州</td>\n",
       "      <td>奥飞</td>\n",
       "      <td>https://www.liepin.com/job/1927611411.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7875551/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>工程管理总监/经理</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>禹洲地产股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927104937.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2245242/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>5-8k·15薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>财务会计</td>\n",
       "      <td>惠州</td>\n",
       "      <td>深圳市豪鹏科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1925219223.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7938237/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>9-14k·15薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>生产主管（惠州豪鹏）</td>\n",
       "      <td>惠州</td>\n",
       "      <td>深圳市豪鹏科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1923424037.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7938237/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-20k·15薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>嵌入式软件开发工程师</td>\n",
       "      <td>宁波</td>\n",
       "      <td>三星医疗</td>\n",
       "      <td>https://www.liepin.com/job/1922772283.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8499408/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>9-12k·12薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>PQE高级工程师（惠州SP）</td>\n",
       "      <td>惠州</td>\n",
       "      <td>深圳市豪鹏科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1915738094.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7938237/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-20k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>供应链系统开发工程师</td>\n",
       "      <td>泉州-晋江</td>\n",
       "      <td>浔兴拉链</td>\n",
       "      <td>https://www.liepin.com/job/1927642085.shtml</td>\n",
       "      <td>https://www.liepin.com/company/1410212/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>11-25k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>游戏测试工程师</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927537007.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>创意营销策划</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927536945.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-25k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>品牌营销经理</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927536797.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>公关传播策划</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927536611.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-10k·12薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>韩语翻译（惠州）</td>\n",
       "      <td>惠州</td>\n",
       "      <td>深圳市豪鹏科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1924401163.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7938237/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-20k·13薪</td>\n",
       "      <td>2020年04月22日</td>\n",
       "      <td>蔚来顾问</td>\n",
       "      <td>深圳</td>\n",
       "      <td>NIO蔚来</td>\n",
       "      <td>https://www.liepin.com/job/1919502019.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8524725/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月21日</td>\n",
       "      <td>营销策划经理</td>\n",
       "      <td>佛山</td>\n",
       "      <td>万和</td>\n",
       "      <td>https://www.liepin.com/job/1927609819.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7862193/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>15-20k·12薪</td>\n",
       "      <td>2020年04月20日</td>\n",
       "      <td>大数据开发工程师(J11103)</td>\n",
       "      <td>杭州-上城区</td>\n",
       "      <td>微贷</td>\n",
       "      <td>https://www.liepin.com/job/1927574277.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8597281/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>5-8k·12薪</td>\n",
       "      <td>2020年04月17日</td>\n",
       "      <td>法务专员</td>\n",
       "      <td>沈阳-市府</td>\n",
       "      <td>微贷</td>\n",
       "      <td>https://www.liepin.com/job/1927541985.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8597281/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-20k·13薪</td>\n",
       "      <td>2020年04月16日</td>\n",
       "      <td>运营经理</td>\n",
       "      <td>佛山-顺德区</td>\n",
       "      <td>万和</td>\n",
       "      <td>https://www.liepin.com/job/1926547347.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7862193/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月15日</td>\n",
       "      <td>数字版权管理运营</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1927471953.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-13k·12薪</td>\n",
       "      <td>2020年04月15日</td>\n",
       "      <td>法务专员(J11102)</td>\n",
       "      <td>杭州</td>\n",
       "      <td>微贷</td>\n",
       "      <td>https://www.liepin.com/job/1927470925.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8597281/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月15日</td>\n",
       "      <td>税务专员(J11101)</td>\n",
       "      <td>杭州-下城区</td>\n",
       "      <td>微贷</td>\n",
       "      <td>https://www.liepin.com/job/1927470269.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8597281/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月15日</td>\n",
       "      <td>Android工程师(J11100)</td>\n",
       "      <td>杭州-下城区</td>\n",
       "      <td>微贷</td>\n",
       "      <td>https://www.liepin.com/job/1927469381.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8597281/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>16-41k·12薪</td>\n",
       "      <td>2020年04月14日</td>\n",
       "      <td>私人财富管家/私人银行理财经理</td>\n",
       "      <td>太原-三桥</td>\n",
       "      <td>山西证券</td>\n",
       "      <td>https://www.liepin.com/job/1923874779.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8538316/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>30-50k·12薪</td>\n",
       "      <td>2020年04月13日</td>\n",
       "      <td>集团总部投资总监</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>禹洲地产股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927409715.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2245242/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-25k·13薪</td>\n",
       "      <td>2020年04月13日</td>\n",
       "      <td>高级运维开发工程师</td>\n",
       "      <td>杭州</td>\n",
       "      <td>网易集团</td>\n",
       "      <td>https://www.liepin.com/job/1926674043.shtml</td>\n",
       "      <td>https://www.liepin.com/company/5964833/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月10日</td>\n",
       "      <td>集团总部招采总监</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>禹洲地产股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927352801.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2245242/</td>\n",
       "      <td>上市公司</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>240 rows × 10 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "         edu     经验          薪水           时间                  职称       行业  \\\n",
       "0      本科及以上  5-10年  20-30k·12薪  2020年04月26日             建筑结构工程师   深圳-南山区   \n",
       "1       统招本科   1-3年          面议  2020年04月25日               频道运维岗   济南-高新区   \n",
       "2       统招本科   1-3年          面议  2020年04月25日               播音主持岗   济南-高新区   \n",
       "3       统招本科   1-3年          面议  2020年04月25日               后期制作岗   济南-高新区   \n",
       "4       统招本科   1-3年          面议  2020年04月25日               摄像记者岗   济南-高新区   \n",
       "5      本科及以上  5-10年          面议  2020年04月25日                  律师   大连-金州区   \n",
       "6       学历不限  5-10年          面议  2020年04月24日              律师（青海）       海东   \n",
       "7       统招本科  5-10年          面议  2020年04月23日            安装成本高级经理   深圳-南山区   \n",
       "8      本科及以上  5-10年  25-35k·16薪  2020年04月23日         集团总部-云架构管理岗       广州   \n",
       "9       统招本科  5-10年          面议  2020年04月23日           工程管理总监/经理   深圳-南山区   \n",
       "10     大专及以上   经验不限    6-7k·13薪  2020年04月22日         人力资源专员（中关村）            \n",
       "11      统招本科   1-3年  11-25k·12薪  2020年04月22日             游戏测试工程师   广州-天河区   \n",
       "12      统招本科   3-5年  10-15k·12薪  2020年04月22日              创意营销策划   广州-天河区   \n",
       "13      统招本科   3-5年  15-25k·12薪  2020年04月22日              品牌营销经理   广州-天河区   \n",
       "14      统招本科   1-3年  10-15k·12薪  2020年04月22日              公关传播策划   广州-天河区   \n",
       "15     本科及以上  5-10年  15-25k·12薪  2020年04月22日              税务管理经理       北京   \n",
       "16     本科及以上   经验不限          面议  2020年04月15日            数字版权管理运营   广州-天河区   \n",
       "17      统招本科  5-10年  30-50k·12薪  2020年04月13日            集团总部投资总监   深圳-南山区   \n",
       "18     本科及以上   3-5年  15-25k·13薪  2020年04月13日           高级运维开发工程师       杭州   \n",
       "19      统招本科  5-10年          面议  2020年04月10日            集团总部招采总监   深圳-南山区   \n",
       "20      统招本科   经验不限          面议  2020年04月07日              营销副总经理      张家口   \n",
       "21     本科及以上  5-10年  30-50k·12薪  2020年03月31日             运营总监/经理    深圳-西丽   \n",
       "22      统招本科  5-10年  20-35k·16薪  2020年03月29日       资深NLP算法工程师/专家   杭州-滨江区   \n",
       "23      统招本科  10年以上  20-40k·12薪  2020年04月26日              草坪养护总监       长春   \n",
       "24      统招本科  10年以上  20-40k·12薪  2020年04月26日              草坪养护总监      石家庄   \n",
       "25      统招本科  10年以上  20-40k·12薪  2020年04月26日              草坪养护总监       廊坊   \n",
       "26      统招本科  10年以上  20-40k·12薪  2020年04月26日              草坪养护总监       上海   \n",
       "27      统招本科  10年以上  20-40k·12薪  2020年04月26日              草坪养护总监       北京   \n",
       "28      统招本科  10年以上  20-40k·12薪  2020年04月26日              草坪养护总监       深圳   \n",
       "29      学历不限   经验不限  20-40k·12薪  2020年04月26日     知识图谱部_产品研发资深工程师       北京   \n",
       "..       ...    ...         ...          ...                 ...      ...   \n",
       "10      统招本科   1-3年  10-15k·13薪  2020年04月23日              前端开发人员  天津-大王古庄   \n",
       "11     大专及以上   1-3年    5-7k·12薪  2020年04月23日           测试技术员（惠州）       惠州   \n",
       "12  中专/中技及以上   1-3年    6-9k·12薪  2020年04月23日            生产班长（惠州）       惠州   \n",
       "13     本科及以上   3-5年   9-14k·15薪  2020年04月23日        PQM高级工程师（惠州）       惠州   \n",
       "14     本科及以上   3-5年  20-30k·13薪  2020年04月23日         运营经理（天猫品牌店）       广州   \n",
       "15     大专及以上   3-5年  10-15k·13薪  2020年04月23日     运营经理/主管（天猫店铺运营）       广州   \n",
       "16      统招本科  5-10年          面议  2020年04月23日           工程管理总监/经理   深圳-南山区   \n",
       "17     本科及以上   1-3年    5-8k·15薪  2020年04月23日                财务会计       惠州   \n",
       "18     大专及以上   3-5年   9-14k·15薪  2020年04月23日          生产主管（惠州豪鹏）       惠州   \n",
       "19     本科及以上   3-5年  10-20k·15薪  2020年04月23日          嵌入式软件开发工程师       宁波   \n",
       "20     本科及以上   1-3年   9-12k·12薪  2020年04月23日      PQE高级工程师（惠州SP）       惠州   \n",
       "21      统招本科   3-5年  10-20k·12薪  2020年04月22日          供应链系统开发工程师    泉州-晋江   \n",
       "22      统招本科   1-3年  11-25k·12薪  2020年04月22日             游戏测试工程师   广州-天河区   \n",
       "23      统招本科   3-5年  10-15k·12薪  2020年04月22日              创意营销策划   广州-天河区   \n",
       "24      统招本科   3-5年  15-25k·12薪  2020年04月22日              品牌营销经理   广州-天河区   \n",
       "25      统招本科   1-3年  10-15k·12薪  2020年04月22日              公关传播策划   广州-天河区   \n",
       "26      统招本科   1-3年   8-10k·12薪  2020年04月22日            韩语翻译（惠州）       惠州   \n",
       "27      统招本科   1-3年  10-20k·13薪  2020年04月22日                蔚来顾问       深圳   \n",
       "28     本科及以上  5-10年          面议  2020年04月21日              营销策划经理       佛山   \n",
       "29     本科及以上   1-3年  15-20k·12薪  2020年04月20日    大数据开发工程师(J11103)   杭州-上城区   \n",
       "30      统招本科   3-5年    5-8k·12薪  2020年04月17日                法务专员    沈阳-市府   \n",
       "31     本科及以上   3-5年  10-20k·13薪  2020年04月16日                运营经理   佛山-顺德区   \n",
       "32     本科及以上   经验不限          面议  2020年04月15日            数字版权管理运营   广州-天河区   \n",
       "33     本科及以上   3-5年  10-13k·12薪  2020年04月15日        法务专员(J11102)       杭州   \n",
       "34     本科及以上   3-5年          面议  2020年04月15日        税务专员(J11101)   杭州-下城区   \n",
       "35     大专及以上   3-5年          面议  2020年04月15日  Android工程师(J11100)   杭州-下城区   \n",
       "36      统招本科   3-5年  16-41k·12薪  2020年04月14日     私人财富管家/私人银行理财经理    太原-三桥   \n",
       "37      统招本科  5-10年  30-50k·12薪  2020年04月13日            集团总部投资总监   深圳-南山区   \n",
       "38     本科及以上   3-5年  15-25k·13薪  2020年04月13日           高级运维开发工程师       杭州   \n",
       "39      统招本科  5-10年          面议  2020年04月10日            集团总部招采总监   深圳-南山区   \n",
       "\n",
       "              公司名称                                           链结  \\\n",
       "0             天音控股  https://www.liepin.com/job/1926991259.shtml   \n",
       "1     中国重型汽车集团有限公司  https://www.liepin.com/job/1927756245.shtml   \n",
       "2     中国重型汽车集团有限公司  https://www.liepin.com/job/1927756189.shtml   \n",
       "3     中国重型汽车集团有限公司  https://www.liepin.com/job/1927756135.shtml   \n",
       "4     中国重型汽车集团有限公司  https://www.liepin.com/job/1927755771.shtml   \n",
       "5             天瑞集团  https://www.liepin.com/job/1927721247.shtml   \n",
       "6             天瑞集团  https://www.liepin.com/job/1927721427.shtml   \n",
       "7       禹洲地产股份有限公司  https://www.liepin.com/job/1927695079.shtml   \n",
       "8             越秀集团  https://www.liepin.com/job/1927682669.shtml   \n",
       "9       禹洲地产股份有限公司  https://www.liepin.com/job/1927104937.shtml   \n",
       "10  中国国际技术智力合作有限公司  https://www.liepin.com/job/1927674527.shtml   \n",
       "11            网易集团  https://www.liepin.com/job/1927537007.shtml   \n",
       "12            网易集团  https://www.liepin.com/job/1927536945.shtml   \n",
       "13            网易集团  https://www.liepin.com/job/1927536797.shtml   \n",
       "14            网易集团  https://www.liepin.com/job/1927536611.shtml   \n",
       "15            天狮集团  https://www.liepin.com/job/1927052483.shtml   \n",
       "16            网易集团  https://www.liepin.com/job/1927471953.shtml   \n",
       "17      禹洲地产股份有限公司  https://www.liepin.com/job/1927409715.shtml   \n",
       "18            网易集团  https://www.liepin.com/job/1926674043.shtml   \n",
       "19      禹洲地产股份有限公司  https://www.liepin.com/job/1927352801.shtml   \n",
       "20   荣盛房地产发展股份有限公司  https://www.liepin.com/job/1927259977.shtml   \n",
       "21      禹洲地产股份有限公司  https://www.liepin.com/job/1927104335.shtml   \n",
       "22            网易集团  https://www.liepin.com/job/1927053241.shtml   \n",
       "23            恒大集团  https://www.liepin.com/job/1927772101.shtml   \n",
       "24            恒大集团  https://www.liepin.com/job/1927772093.shtml   \n",
       "25            恒大集团  https://www.liepin.com/job/1927772089.shtml   \n",
       "26            恒大集团  https://www.liepin.com/job/1927772081.shtml   \n",
       "27            恒大集团  https://www.liepin.com/job/1927772075.shtml   \n",
       "28            恒大集团  https://www.liepin.com/job/1927772071.shtml   \n",
       "29           Baidu  https://www.liepin.com/job/1927772031.shtml   \n",
       "..             ...                                          ...   \n",
       "10            大禹节水  https://www.liepin.com/job/1927684493.shtml   \n",
       "11     深圳市豪鹏科技有限公司  https://www.liepin.com/job/1927684487.shtml   \n",
       "12     深圳市豪鹏科技有限公司  https://www.liepin.com/job/1927684115.shtml   \n",
       "13     深圳市豪鹏科技有限公司  https://www.liepin.com/job/1927683679.shtml   \n",
       "14              奥飞  https://www.liepin.com/job/1927613401.shtml   \n",
       "15              奥飞  https://www.liepin.com/job/1927611411.shtml   \n",
       "16      禹洲地产股份有限公司  https://www.liepin.com/job/1927104937.shtml   \n",
       "17     深圳市豪鹏科技有限公司  https://www.liepin.com/job/1925219223.shtml   \n",
       "18     深圳市豪鹏科技有限公司  https://www.liepin.com/job/1923424037.shtml   \n",
       "19            三星医疗  https://www.liepin.com/job/1922772283.shtml   \n",
       "20     深圳市豪鹏科技有限公司  https://www.liepin.com/job/1915738094.shtml   \n",
       "21            浔兴拉链  https://www.liepin.com/job/1927642085.shtml   \n",
       "22            网易集团  https://www.liepin.com/job/1927537007.shtml   \n",
       "23            网易集团  https://www.liepin.com/job/1927536945.shtml   \n",
       "24            网易集团  https://www.liepin.com/job/1927536797.shtml   \n",
       "25            网易集团  https://www.liepin.com/job/1927536611.shtml   \n",
       "26     深圳市豪鹏科技有限公司  https://www.liepin.com/job/1924401163.shtml   \n",
       "27           NIO蔚来  https://www.liepin.com/job/1919502019.shtml   \n",
       "28              万和  https://www.liepin.com/job/1927609819.shtml   \n",
       "29              微贷  https://www.liepin.com/job/1927574277.shtml   \n",
       "30              微贷  https://www.liepin.com/job/1927541985.shtml   \n",
       "31              万和  https://www.liepin.com/job/1926547347.shtml   \n",
       "32            网易集团  https://www.liepin.com/job/1927471953.shtml   \n",
       "33              微贷  https://www.liepin.com/job/1927470925.shtml   \n",
       "34              微贷  https://www.liepin.com/job/1927470269.shtml   \n",
       "35              微贷  https://www.liepin.com/job/1927469381.shtml   \n",
       "36            山西证券  https://www.liepin.com/job/1923874779.shtml   \n",
       "37      禹洲地产股份有限公司  https://www.liepin.com/job/1927409715.shtml   \n",
       "38            网易集团  https://www.liepin.com/job/1926674043.shtml   \n",
       "39      禹洲地产股份有限公司  https://www.liepin.com/job/1927352801.shtml   \n",
       "\n",
       "                                      公司URL  热门公司类型  \n",
       "0   https://www.liepin.com/company/7954048/  中国500强  \n",
       "1   https://www.liepin.com/company/9739005/  中国500强  \n",
       "2   https://www.liepin.com/company/9739005/  中国500强  \n",
       "3   https://www.liepin.com/company/9739005/  中国500强  \n",
       "4   https://www.liepin.com/company/9739005/  中国500强  \n",
       "5   https://www.liepin.com/company/8946384/  中国500强  \n",
       "6   https://www.liepin.com/company/8946384/  中国500强  \n",
       "7   https://www.liepin.com/company/2245242/  中国500强  \n",
       "8   https://www.liepin.com/company/4585715/  中国500强  \n",
       "9   https://www.liepin.com/company/2245242/  中国500强  \n",
       "10  https://www.liepin.com/company/1233751/  中国500强  \n",
       "11  https://www.liepin.com/company/5964833/  中国500强  \n",
       "12  https://www.liepin.com/company/5964833/  中国500强  \n",
       "13  https://www.liepin.com/company/5964833/  中国500强  \n",
       "14  https://www.liepin.com/company/5964833/  中国500强  \n",
       "15   https://www.liepin.com/company/571564/  中国500强  \n",
       "16  https://www.liepin.com/company/5964833/  中国500强  \n",
       "17  https://www.liepin.com/company/2245242/  中国500强  \n",
       "18  https://www.liepin.com/company/5964833/  中国500强  \n",
       "19  https://www.liepin.com/company/2245242/  中国500强  \n",
       "20   https://www.liepin.com/company/548548/  中国500强  \n",
       "21  https://www.liepin.com/company/2245242/  中国500强  \n",
       "22  https://www.liepin.com/company/5964833/  中国500强  \n",
       "23   https://www.liepin.com/company/850378/  中国500强  \n",
       "24   https://www.liepin.com/company/850378/  中国500强  \n",
       "25   https://www.liepin.com/company/850378/  中国500强  \n",
       "26   https://www.liepin.com/company/850378/  中国500强  \n",
       "27   https://www.liepin.com/company/850378/  中国500强  \n",
       "28   https://www.liepin.com/company/850378/  中国500强  \n",
       "29   https://www.liepin.com/company/884492/  中国500强  \n",
       "..                                      ...     ...  \n",
       "10  https://www.liepin.com/company/9135243/    上市公司  \n",
       "11  https://www.liepin.com/company/7938237/    上市公司  \n",
       "12  https://www.liepin.com/company/7938237/    上市公司  \n",
       "13  https://www.liepin.com/company/7938237/    上市公司  \n",
       "14  https://www.liepin.com/company/7875551/    上市公司  \n",
       "15  https://www.liepin.com/company/7875551/    上市公司  \n",
       "16  https://www.liepin.com/company/2245242/    上市公司  \n",
       "17  https://www.liepin.com/company/7938237/    上市公司  \n",
       "18  https://www.liepin.com/company/7938237/    上市公司  \n",
       "19  https://www.liepin.com/company/8499408/    上市公司  \n",
       "20  https://www.liepin.com/company/7938237/    上市公司  \n",
       "21  https://www.liepin.com/company/1410212/    上市公司  \n",
       "22  https://www.liepin.com/company/5964833/    上市公司  \n",
       "23  https://www.liepin.com/company/5964833/    上市公司  \n",
       "24  https://www.liepin.com/company/5964833/    上市公司  \n",
       "25  https://www.liepin.com/company/5964833/    上市公司  \n",
       "26  https://www.liepin.com/company/7938237/    上市公司  \n",
       "27  https://www.liepin.com/company/8524725/    上市公司  \n",
       "28  https://www.liepin.com/company/7862193/    上市公司  \n",
       "29  https://www.liepin.com/company/8597281/    上市公司  \n",
       "30  https://www.liepin.com/company/8597281/    上市公司  \n",
       "31  https://www.liepin.com/company/7862193/    上市公司  \n",
       "32  https://www.liepin.com/company/5964833/    上市公司  \n",
       "33  https://www.liepin.com/company/8597281/    上市公司  \n",
       "34  https://www.liepin.com/company/8597281/    上市公司  \n",
       "35  https://www.liepin.com/company/8597281/    上市公司  \n",
       "36  https://www.liepin.com/company/8538316/    上市公司  \n",
       "37  https://www.liepin.com/company/2245242/    上市公司  \n",
       "38  https://www.liepin.com/company/5964833/    上市公司  \n",
       "39  https://www.liepin.com/company/2245242/    上市公司  \n",
       "\n",
       "[240 rows x 10 columns]"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "\n",
    "list_df = list()\n",
    "for k,v in 参数_compTag_用户体验.items():\n",
    "    payload = v\n",
    "    df = requests_liepin( url, params = payload)\n",
    "    df = df.assign (热门公司类型 = k)    \n",
    "    list_df.append(df)\n",
    "\n",
    "df_all = pd.concat(list_df)\n",
    "df_all"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "# C-4   输出\n",
    "df_all.to_excel(\"公司类型的数据爬取.xlsx\", sheet_name=\"搜查结果\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 爬取行业数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'互联网/电商': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=040&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '游戏产业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=420&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '计算机软件': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=010&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " 'IT服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=030&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '电子/芯片/半导体': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=050&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '通信业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=060&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '计算机/网络设备': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=020&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '房地产/建筑': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=080&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '规划/设计/装潢': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=100&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '房地产服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=090&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '银行': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=130&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '保险': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=140&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '基金/证券/投资': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=150&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '会计/审计': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=430&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '信托/担保/拍卖': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=500&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '快消品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=190&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '批发零售': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=240&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '服装纺织': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=200&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '家具/家电': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=210&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '办公设备': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=220&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '奢侈品/收藏品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=460&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '珠宝/玩具/工艺品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=470&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '汽车/摩托车': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=350&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '机械/机电/重工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=360&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '印刷/包装/造纸': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=180&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '原材料加工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=370&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '仪器/电气/自动化': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=340&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '制药/生物工程': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=270&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '医疗/保健/美容': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=280&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '医疗器械': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=290&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '能源/水利': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=330&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '石油/化工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=310&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '采掘/冶炼/矿产': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=320&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '环保': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=300&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '新能源': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=490&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '专业服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=120&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '中介服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=110&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '外包服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=440&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '检测/认证': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=450&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '餐饮/酒旅/服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=230&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '文体娱乐': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=260&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '租赁服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=510&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '广告/市场/会展': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=070&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '影视文化': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=170&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '教育培训': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=380&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '交通/物流/运输': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=250&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '贸易/进出口': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=160&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '航空/航天': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=480&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '政务/公共服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=390&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '农林牧渔': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=410&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4',\n",
       " '其他行业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=400&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4'}"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 抓取行业的数据（链接、文本）\n",
    "行业数据选择器链结 = r.html.xpath('//div[@data-selector=\"search-conditions\"]')[0] \\\n",
    "                    .xpath('//dt[@class=\"search-title\"]/following-sibling::dd')[1] \\\n",
    "                    .xpath('//div[contains(@class,\"sub-industry\")]/a')\n",
    "行业数据选择器链结\n",
    "\n",
    "行业数据选择器链结 = { x.xpath(\"a/text()\")[0]:x.xpath(\"a/@href\")[0] for x in 行业数据选择器链结}\n",
    "行业数据选择器链结"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'pandas.core.frame.DataFrame'>\n",
      "RangeIndex: 51 entries, 0 to 50\n",
      "Data columns (total 6 columns):\n",
      "scheme      51 non-null object\n",
      "netloc      51 non-null object\n",
      "path        51 non-null object\n",
      "params      51 non-null object\n",
      "query       51 non-null object\n",
      "fragment    51 non-null object\n",
      "dtypes: object(6)\n",
      "memory usage: 2.5+ KB\n",
      "scheme       1\n",
      "netloc       1\n",
      "path         1\n",
      "params       1\n",
      "query       51\n",
      "fragment     1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>scheme</th>\n",
       "      <th>netloc</th>\n",
       "      <th>path</th>\n",
       "      <th>params</th>\n",
       "      <th>query</th>\n",
       "      <th>fragment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>subIndustry=&amp;init=-1&amp;industryType=industry_01&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  scheme netloc       path params  \\\n",
       "0                /zhaopin/          \n",
       "\n",
       "                                               query fragment  \n",
       "0  subIndustry=&init=-1&industryType=industry_01&...           "
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from urllib.parse import urlparse, parse_qs\n",
    "\n",
    "df = pd.DataFrame([ urlparse(x) for x in 行业数据选择器链结.values()])\n",
    "df.info()\n",
    "print(df.nunique())\n",
    "df.head(1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "ckid              1\n",
      "d_ckId            1\n",
      "d_curPage         1\n",
      "d_headId          1\n",
      "d_pageSize        1\n",
      "d_sfrom           1\n",
      "flushckid         1\n",
      "fromSearchBtn     1\n",
      "headckid          1\n",
      "industries       51\n",
      "industryType     12\n",
      "init              1\n",
      "keyword           1\n",
      "siTag             1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>ckid</th>\n",
       "      <th>d_ckId</th>\n",
       "      <th>d_curPage</th>\n",
       "      <th>d_headId</th>\n",
       "      <th>d_pageSize</th>\n",
       "      <th>d_sfrom</th>\n",
       "      <th>flushckid</th>\n",
       "      <th>fromSearchBtn</th>\n",
       "      <th>headckid</th>\n",
       "      <th>industries</th>\n",
       "      <th>industryType</th>\n",
       "      <th>init</th>\n",
       "      <th>keyword</th>\n",
       "      <th>siTag</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>040</td>\n",
       "      <td>industry_01</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>420</td>\n",
       "      <td>industry_01</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>010</td>\n",
       "      <td>industry_01</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>030</td>\n",
       "      <td>industry_01</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>0</td>\n",
       "      <td>521f01d84c3b99bf56614979c8dfdbb4</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>8048cb4ce04891b3</td>\n",
       "      <td>050</td>\n",
       "      <td>industry_02</td>\n",
       "      <td>-1</td>\n",
       "      <td>人力资源</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "               ckid                            d_ckId d_curPage  \\\n",
       "0  8048cb4ce04891b3  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "1  8048cb4ce04891b3  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "2  8048cb4ce04891b3  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "3  8048cb4ce04891b3  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "4  8048cb4ce04891b3  521f01d84c3b99bf56614979c8dfdbb4         0   \n",
       "\n",
       "                           d_headId d_pageSize         d_sfrom flushckid  \\\n",
       "0  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "1  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "2  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "3  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "4  521f01d84c3b99bf56614979c8dfdbb4         40  search_unknown         1   \n",
       "\n",
       "  fromSearchBtn          headckid industries industryType init keyword  \\\n",
       "0             2  8048cb4ce04891b3        040  industry_01   -1    人力资源   \n",
       "1             2  8048cb4ce04891b3        420  industry_01   -1    人力资源   \n",
       "2             2  8048cb4ce04891b3        010  industry_01   -1    人力资源   \n",
       "3             2  8048cb4ce04891b3        030  industry_01   -1    人力资源   \n",
       "4             2  8048cb4ce04891b3        050  industry_02   -1    人力资源   \n",
       "\n",
       "                                           siTag  \n",
       "0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "1  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "2  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "3  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "4  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  "
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Parse each URL's query string into its own set of columns.\n",
    "# parse_qs returns a list per key, so only the first value is kept to get scalar cells\n",
    "# (the plain pd.DataFrame([parse_qs(q) for q in df['query']]) form leaves lists in every cell).\n",
    "df_qs = pd.DataFrame(\n",
    "    [\n",
    "        {name: values[0] for name, values in parse_qs(query_string).items()}\n",
    "        for query_string in df['query']\n",
    "    ]\n",
    ")\n",
    "print(df_qs.nunique())\n",
    "df_qs.head()\n",
    "# To look at specific columns only: df_qs[['keyword', 'industries']]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['040'], 'keyword': ['人力资源'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}\n",
      "{'互联网/电商': '040', '游戏产业': '420', '计算机软件': '010', 'IT服务': '030', '电子/芯片/半导体': '050', '通信业': '060', '计算机/网络设备': '020', '房地产/建筑': '080', '规划/设计/装潢': '100', '房地产服务': '090', '银行': '130', '保险': '140', '基金/证券/投资': '150', '会计/审计': '430', '信托/担保/拍卖': '500', '快消品': '190', '批发零售': '240', '服装纺织': '200', '家具/家电': '210', '办公设备': '220', '奢侈品/收藏品': '460', '珠宝/玩具/工艺品': '470', '汽车/摩托车': '350', '机械/机电/重工': '360', '印刷/包装/造纸': '180', '原材料加工': '370', '仪器/电气/自动化': '340', '制药/生物工程': '270', '医疗/保健/美容': '280', '医疗器械': '290', '能源/水利': '330', '石油/化工': '310', '采掘/冶炼/矿产': '320', '环保': '300', '新能源': '490', '专业服务': '120', '中介服务': '110', '外包服务': '440', '检测/认证': '450', '餐饮/酒旅/服务': '230', '文体娱乐': '260', '租赁服务': '510', '广告/市场/会展': '070', '影视文化': '170', '教育培训': '380', '交通/物流/运输': '250', '贸易/进出口': '160', '航空/航天': '480', '政务/公共服务': '390', '农林牧渔': '410', '其他行业': '400'}\n"
     ]
    }
   ],
   "source": [
    "# 建构 参数模板 及 字典_industries\n",
    "def parse_url_qs_for_industries(url):\n",
    "    \"\"\"Return the query-string parameters of ``url`` as a dict.\n",
    "\n",
    "    Each key maps to the list of values produced by ``urllib.parse.parse_qs``.\n",
    "    \"\"\"\n",
    "    return parse_qs(urlparse(url).query)\n",
    "\n",
    "# Use the first industry link's parsed query as the parameter template for later requests.\n",
    "参数模板 = parse_url_qs_for_industries(list(行业数据选择器链结.values())[0])\n",
    "print(参数模板)\n",
    "\n",
    "# Map each key of 行业数据选择器链结 to the `industries` code carried in its link.\n",
    "# parse_qs yields a list per key, hence the [0].\n",
    "字典_industries = {\n",
    "    label: parse_url_qs_for_industries(link)['industries'][0]\n",
    "    for label, link in 行业数据选择器链结.items()\n",
    "}\n",
    "print(字典_industries)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'互联网/电商': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['040'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '游戏产业': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['420'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '计算机软件': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['010'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, 'IT服务': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['030'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '电子/芯片/半导体': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['050'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 
'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '通信业': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['060'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '计算机/网络设备': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['020'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '房地产/建筑': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['080'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '规划/设计/装潢': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['100'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': 
['521f01d84c3b99bf56614979c8dfdbb4']}, '房地产服务': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['090'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '银行': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['130'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '保险': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['140'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '基金/证券/投资': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['150'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '会计/审计': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['430'], 'keyword': ['用户体验'], 'ckid': 
['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '信托/担保/拍卖': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['500'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '快消品': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['190'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '批发零售': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['240'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '服装纺织': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['200'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': 
['521f01d84c3b99bf56614979c8dfdbb4']}, '家具/家电': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['210'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '办公设备': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['220'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '奢侈品/收藏品': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['460'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '珠宝/玩具/工艺品': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['470'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '汽车/摩托车': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['350'], 'keyword': ['用户体验'], 
'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '机械/机电/重工': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['360'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '印刷/包装/造纸': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['180'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '原材料加工': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['370'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '仪器/电气/自动化': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['340'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 
'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '制药/生物工程': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['270'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '医疗/保健/美容': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['280'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '医疗器械': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['290'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '能源/水利': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['330'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '石油/化工': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['310'], 'keyword': 
['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '采掘/冶炼/矿产': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['320'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '环保': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['300'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '新能源': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['490'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '专业服务': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['120'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 
'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '中介服务': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['110'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '外包服务': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['440'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '检测/认证': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['450'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '餐饮/酒旅/服务': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['230'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '文体娱乐': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['260'], 'keyword': 
['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '租赁服务': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['510'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '广告/市场/会展': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['070'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '影视文化': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['170'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '教育培训': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['380'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 
'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '交通/物流/运输': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['250'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '贸易/进出口': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['160'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '航空/航天': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['480'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '政务/公共服务': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['390'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '农林牧渔': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['410'], 'keyword': 
['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}, '其他行业': {'init': ['-1'], 'industryType': ['industry_01'], 'headckid': ['8048cb4ce04891b3'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'industries': ['400'], 'keyword': ['用户体验'], 'ckid': ['8048cb4ce04891b3'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['521f01d84c3b99bf56614979c8dfdbb4'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['521f01d84c3b99bf56614979c8dfdbb4']}}"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    }
   ],
   "source": [
    "def 参数模板生成(industries, keyword):\n",
    "    \"\"\"Return a shallow copy of the global 参数模板 with two entries overridden.\n",
    "\n",
    "    The template dict itself is left untouched; in the returned dict the\n",
    "    'industries' and 'keyword' entries are set to the given arguments.\n",
    "    \"\"\"\n",
    "    return {**参数模板, 'industries': industries, 'keyword': keyword}\n",
    "\n",
    "# Build one request payload per industry, all searching the keyword '用户体验'.\n",
    "# Values are wrapped in lists to match the list-valued entries of the parsed template.\n",
    "参数_industries_用户体验 = {\n",
    "    name: 参数模板生成(industries=[code], keyword=['用户体验'])\n",
    "    for name, code in 字典_industries.items()\n",
    "}\n",
    "print(参数_industries_用户体验)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'https://www.liepin.com/zhaopin/?init=-1&industryType=industry_01&headckid=8048cb4ce04891b3&flushckid=1&fromSearchBtn=2&industries=170&keyword=%E7%94%A8%E6%88%B7%E4%BD%93%E9%AA%8C&ckid=8048cb4ce04891b3&siTag=1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=521f01d84c3b99bf56614979c8dfdbb4&d_curPage=0&d_pageSize=40&d_headId=521f01d84c3b99bf56614979c8dfdbb4'"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Smoke test: request a single entry ('影视文化') with its generated parameters\n",
    "# and show the resulting URL to check that the parameter template was built correctly.\n",
    "session = HTMLSession()\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "payload = 参数_industries_用户体验['影视文化']\n",
    "r = session.get(url, params=payload)\n",
    "r.url"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Module-level HTMLSession; requests_liepin (defined in this cell) sends its GET through `session`.\n",
    "session = HTMLSession()\n",
    "\n",
    "def requests_liepin( url, params):\n",
    "    r = session.get( url , params = payload)\n",
    "\n",
    "    # 先取特定元素, 精准打击其子后辈\n",
    "    主要元素 = r.html.xpath( '//ul[@class=\"sojob-list\"]/li')\n",
    "\n",
    "    # 作为xpath字典，键为我要抓的牛肉名称，值为xpath\n",
    "    dict_xpaths={ \n",
    "        'text': {\n",
    "            'edu':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]',\n",
    "            '经验':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]/following-sibling::span',\n",
    "            '薪水':    '//div[contains(@class,\"job-info\")]/p/span[@class=\"text-warning\"]', \n",
    "            '时间':    '//div[contains(@class,\"job-info\")]/p/time/@title', \n",
    "            '职称':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '行业': '//div[contains(@class,\"job-info\")]/p/a',\n",
    "            '公司名称': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        },\n",
    "        'text_content': {\n",
    "        },\n",
    "        'href': {\n",
    "            '链结':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司URL': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        }\n",
    "    }\n",
    "\n",
    "    def get_e_text_content(_xpath_):\n",
    "        # 高级列表推导\n",
    "        暂存结果 = [e.xpath(_xpath_)[0].lxml.text_content() for e in 主要元素]\n",
    "        return(暂存结果)\n",
    "\n",
    "    def get_e_text(_xpath_):\n",
    "        # 高级列表推导\n",
    "        暂存结果 = [\"\".join([x.strip() if type(x) is str else x.text.strip() for x in e.xpath(_xpath_)]) for e in 主要元素]\n",
    "        return(暂存结果)\n",
    "\n",
    "    def get_e_href(_xpath_):\n",
    "        # 高级列表推导\n",
    "        暂存结果 = [list(e.xpath(_xpath_, first=True).absolute_links)[0] \\\n",
    "                   if len(e.xpath(_xpath_, first=True).absolute_links) >= 1  \\\n",
    "                   else \"\" for e in 主要元素]\n",
    "        return(暂存结果)\n",
    "\n",
    "    # 只对主要元素下进行.xpath取值\n",
    "    数据字典 = dict()\n",
    "\n",
    "    数据字典 = {k:get_e_text_content(v) for k,v in dict_xpaths['text_content'].items()}\n",
    "    数据字典.update({k:get_e_text(v) for k,v in dict_xpaths['text'].items()})\n",
    "    数据字典.update({k:get_e_href(v) for k,v in dict_xpaths['href'].items()})\n",
    "\n",
    "    数据 = pd.DataFrame(数据字典)\n",
    "    #数据.to_excel(\"20春_Web数据挖掘_week03_liepin.xlsx\", sheet_name=\"搜查结果\")\n",
    "    return (数据)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>edu</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>时间</th>\n",
       "      <th>职称</th>\n",
       "      <th>行业</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>链结</th>\n",
       "      <th>公司URL</th>\n",
       "      <th>热门行业分类</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>30-45k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>大数据开发工程师</td>\n",
       "      <td>上海-浦东新区</td>\n",
       "      <td>上海基分文化传播</td>\n",
       "      <td>https://www.liepin.com/job/1927770805.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8895584/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-30k·14薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>资金业务产品经理</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>畅捷通支付北京</td>\n",
       "      <td>https://www.liepin.com/job/1927767527.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8577672/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>5-7k·13薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>客户专员</td>\n",
       "      <td>上海-杨浦区</td>\n",
       "      <td>京创智汇(上海)物流科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927765811.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10054581/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>电商天猫京东运营</td>\n",
       "      <td>杭州-南苑</td>\n",
       "      <td>北京海纳世纪科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927760887.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9215228/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-20k·13薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>客服主管</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>泽金金服</td>\n",
       "      <td>https://www.liepin.com/job/1927746007.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8787574/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>店铺店长</td>\n",
       "      <td>上海-杨浦区</td>\n",
       "      <td>百合网</td>\n",
       "      <td>https://www.liepin.com/job/1927726909.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10077527/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>18-28k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>政务售前工程师</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>创能科技</td>\n",
       "      <td>https://www.liepin.com/job/1927692139.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7992349/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>区域销售总监/经理</td>\n",
       "      <td>太原-坞城</td>\n",
       "      <td>优网科技</td>\n",
       "      <td>https://www.liepin.com/job/1927690093.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7896274/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>5-8k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>信息流优化师</td>\n",
       "      <td></td>\n",
       "      <td>盛拓传媒</td>\n",
       "      <td>https://www.liepin.com/job/1927688057.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8597194/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>售前金融项目咨询经理/总监</td>\n",
       "      <td></td>\n",
       "      <td>慧科讯业</td>\n",
       "      <td>https://www.liepin.com/job/1927673039.shtml</td>\n",
       "      <td>https://www.liepin.com/company/1199797/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-16k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>资深安卓开发工程师</td>\n",
       "      <td>长沙</td>\n",
       "      <td>湖南岳麓山数据科学与技术研究院有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927660815.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10184205/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>5-10k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>税务会计</td>\n",
       "      <td>深圳-龙华区</td>\n",
       "      <td>佛山市启动成功智能科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927649765.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9762201/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>直播项目专场招聘(汽车电商)</td>\n",
       "      <td>杭州</td>\n",
       "      <td>大搜车</td>\n",
       "      <td>https://www.liepin.com/job/1927615677.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8141158/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>12-20k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>大客户销售/大客户销售总监</td>\n",
       "      <td>广州</td>\n",
       "      <td>大麦信息</td>\n",
       "      <td>https://www.liepin.com/job/1927615367.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7870705/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-12k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>出房管家（六险一金&amp;带薪培训）</td>\n",
       "      <td>南京</td>\n",
       "      <td>北京自如生活企业管理有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927570175.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8916470/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-10k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>娱乐节目编导</td>\n",
       "      <td>北京</td>\n",
       "      <td>橘子文化</td>\n",
       "      <td>https://www.liepin.com/job/1927470669.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8310595/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20-40k·13薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>BI工程师</td>\n",
       "      <td>北京</td>\n",
       "      <td>百合网</td>\n",
       "      <td>https://www.liepin.com/job/1927468011.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10077527/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-25k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>推广经理</td>\n",
       "      <td>杭州-滨江区</td>\n",
       "      <td>杭州大热电子商务有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927385183.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9857093/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-25k·13薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>C端产品经理</td>\n",
       "      <td>北京</td>\n",
       "      <td>百合网</td>\n",
       "      <td>https://www.liepin.com/job/1927349661.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10077527/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>12-20k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>资深产品经理</td>\n",
       "      <td>郑州</td>\n",
       "      <td>郑州珑凌科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927310141.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8113931/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>18-28k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>软件售前工程师</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>创能科技</td>\n",
       "      <td>https://www.liepin.com/job/1927297737.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7992349/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>金交所项目市场经理-XMGJ</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>深圳瀚德金融科技控股有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927265957.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9138140/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>7-16k·14薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>高级亚马逊运营专员（储备组长）</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>广州瀚翼扬电子商务有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927163671.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8881741/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>天猫运营</td>\n",
       "      <td>杭州-南苑</td>\n",
       "      <td>北京海纳世纪科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927036409.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9215228/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>电商运营专员</td>\n",
       "      <td>上海-闵行区</td>\n",
       "      <td>华硕电脑（上海）有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1926477641.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8134688/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>9-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>北京</td>\n",
       "      <td>酷划在线</td>\n",
       "      <td>https://www.liepin.com/job/1926294067.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7967239/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td></td>\n",
       "      <td>国汽(北京)智能网联汽车研究院有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1926037471.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9532936/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>招聘专员</td>\n",
       "      <td>上海-闵行区</td>\n",
       "      <td>华硕电脑（上海）有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1925975821.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8134688/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>5-9k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>电商设计/美工/平面设计</td>\n",
       "      <td>上海</td>\n",
       "      <td>优趣汇</td>\n",
       "      <td>https://www.liepin.com/job/1925936685.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8453342/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>15-25k·13薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>财务经理</td>\n",
       "      <td>北京-望京</td>\n",
       "      <td>百合网</td>\n",
       "      <td>https://www.liepin.com/job/1925055847.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10077527/</td>\n",
       "      <td>互联网/电商</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>7-8k·12薪</td>\n",
       "      <td>2020年04月24日</td>\n",
       "      <td>前期与成本控制部经理</td>\n",
       "      <td>来宾</td>\n",
       "      <td>广西来宾国有资本投资运营集团有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1924092973.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10029116/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>5-6k·12薪</td>\n",
       "      <td>2020年04月24日</td>\n",
       "      <td>营销策划主管</td>\n",
       "      <td>来宾</td>\n",
       "      <td>广西来宾国有资本投资运营集团有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1919733241.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10029116/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月24日</td>\n",
       "      <td>桥涵设计工程师</td>\n",
       "      <td>南京-建邺区</td>\n",
       "      <td>苏交科</td>\n",
       "      <td>https://www.liepin.com/job/1927540495.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8445465/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>中新智地-党务文秘专员（中新集团下属公司）</td>\n",
       "      <td>苏州</td>\n",
       "      <td>中新苏州工业园区开发集团股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927695151.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8096825/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>8-14k·12薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>财务部 高级执行员/资深执行员</td>\n",
       "      <td>苏州</td>\n",
       "      <td>中新苏州工业园区开发集团股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927687865.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8096825/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>7-14k·18薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>招商部 执行员/高级执行员/资深执行员</td>\n",
       "      <td>苏州</td>\n",
       "      <td>中新苏州工业园区开发集团股份有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927687613.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8096825/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>18-22k·12薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>工程技术支持及能源管理经理</td>\n",
       "      <td>上海-静安区</td>\n",
       "      <td>爱玛客</td>\n",
       "      <td>https://www.liepin.com/job/1926893265.shtml</td>\n",
       "      <td>https://www.liepin.com/company/941363/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-10k·13薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>A培训讲师</td>\n",
       "      <td>杭州-滨江区</td>\n",
       "      <td>上海比户环保科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1925924485.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9728295/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>25-35k·20薪</td>\n",
       "      <td>2020年04月23日</td>\n",
       "      <td>财务总监</td>\n",
       "      <td>无锡-惠山区</td>\n",
       "      <td>江苏菲沃泰纳米科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1915792154.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9318072/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>30-60k·12薪</td>\n",
       "      <td>2020年04月21日</td>\n",
       "      <td>心理咨询师</td>\n",
       "      <td>上海-松江区</td>\n",
       "      <td>上海戒成健康咨询有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927202691.shtml</td>\n",
       "      <td>https://www.liepin.com/company/12193883/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月21日</td>\n",
       "      <td>总裁秘书</td>\n",
       "      <td>杭州-宁围</td>\n",
       "      <td>博地控股集团有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1922648561.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10041535/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>10-25k·12薪</td>\n",
       "      <td>2020年04月08日</td>\n",
       "      <td>技术研发</td>\n",
       "      <td>青岛</td>\n",
       "      <td>青岛科博制冷设备有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1923230537.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9905465/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-25k·12薪</td>\n",
       "      <td>2019年08月20日</td>\n",
       "      <td>销售总监-3</td>\n",
       "      <td>上海</td>\n",
       "      <td>上海星月投资管理有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1922712939.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9627932/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>清远</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772103.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>长春</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772101.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>郑州</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772099.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>济南</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772097.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>潍坊</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772095.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>石家庄</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772093.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>秦皇岛</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772091.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>廊坊</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772089.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>重庆</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772087.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>武汉</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772085.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>南京</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772083.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>上海</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772081.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>大连</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772079.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>天津</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772077.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>北京</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772075.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>珠海</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772073.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>草坪养护总监</td>\n",
       "      <td>深圳</td>\n",
       "      <td>恒大集团</td>\n",
       "      <td>https://www.liepin.com/job/1927772071.shtml</td>\n",
       "      <td>https://www.liepin.com/company/850378/</td>\n",
       "      <td>其他行业</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2040 rows × 10 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      edu     经验          薪水           时间                     职称       行业  \\\n",
       "0   本科及以上  5-10年  30-45k·16薪  2020年04月26日               大数据开发工程师  上海-浦东新区   \n",
       "1   本科及以上   3-5年  15-30k·14薪  2020年04月26日               资金业务产品经理   深圳-南山区   \n",
       "2   大专及以上   经验不限    5-7k·13薪  2020年04月26日                   客户专员   上海-杨浦区   \n",
       "3   大专及以上   3-5年  15-30k·12薪  2020年04月26日               电商天猫京东运营    杭州-南苑   \n",
       "4   本科及以上   3-5年  10-20k·13薪  2020年04月26日                   客服主管   深圳-南山区   \n",
       "5   大专及以上   1-3年  10-15k·12薪  2020年04月26日                   店铺店长   上海-杨浦区   \n",
       "6   本科及以上  5-10年  18-28k·12薪  2020年04月26日                政务售前工程师   广州-天河区   \n",
       "7   大专及以上   3-5年          面议  2020年04月26日              区域销售总监/经理    太原-坞城   \n",
       "8   大专及以上   经验不限    5-8k·12薪  2020年04月26日                 信息流优化师            \n",
       "9    统招本科  5-10年          面议  2020年04月26日          售前金融项目咨询经理/总监            \n",
       "10   统招本科   1-3年  10-16k·12薪  2020年04月26日              资深安卓开发工程师       长沙   \n",
       "11  大专及以上   1-3年   5-10k·12薪  2020年04月26日                   税务会计   深圳-龙华区   \n",
       "12  大专及以上   经验不限          面议  2020年04月26日         直播项目专场招聘(汽车电商)       杭州   \n",
       "13  大专及以上   3-5年  12-20k·12薪  2020年04月26日          大客户销售/大客户销售总监       广州   \n",
       "14   统招本科   1-3年   8-12k·12薪  2020年04月26日        出房管家（六险一金&带薪培训）       南京   \n",
       "15  本科及以上   1-3年   8-10k·12薪  2020年04月26日                 娱乐节目编导       北京   \n",
       "16  本科及以上   3-5年  20-40k·13薪  2020年04月26日                  BI工程师       北京   \n",
       "17   统招本科   3-5年  15-25k·12薪  2020年04月26日                   推广经理   杭州-滨江区   \n",
       "18  本科及以上   3-5年  15-25k·13薪  2020年04月26日                 C端产品经理       北京   \n",
       "19   统招本科   3-5年  12-20k·12薪  2020年04月26日                 资深产品经理       郑州   \n",
       "20  本科及以上  5-10年  18-28k·12薪  2020年04月26日                软件售前工程师   广州-天河区   \n",
       "21   统招本科  5-10年  15-30k·12薪  2020年04月26日         金交所项目市场经理-XMGJ   深圳-南山区   \n",
       "22  本科及以上   1-3年   7-16k·14薪  2020年04月26日        高级亚马逊运营专员（储备组长）   广州-海珠区   \n",
       "23  大专及以上   3-5年  15-30k·12薪  2020年04月26日                   天猫运营    杭州-南苑   \n",
       "24  本科及以上   经验不限          面议  2020年04月26日                 电商运营专员   上海-闵行区   \n",
       "25   统招本科   1-3年   9-15k·12薪  2020年04月26日                前端开发工程师       北京   \n",
       "26  硕士及以上  5-10年          面议  2020年04月26日                前端开发工程师            \n",
       "27   统招本科   1-3年          面议  2020年04月26日                   招聘专员   上海-闵行区   \n",
       "28  大专及以上   1-3年    5-9k·16薪  2020年04月26日           电商设计/美工/平面设计       上海   \n",
       "29  本科及以上   1-3年  15-25k·13薪  2020年04月26日                   财务经理    北京-望京   \n",
       "..    ...    ...         ...          ...                    ...      ...   \n",
       "10  本科及以上   3-5年    7-8k·12薪  2020年04月24日             前期与成本控制部经理       来宾   \n",
       "11   统招本科   1-3年    5-6k·12薪  2020年04月24日                 营销策划主管       来宾   \n",
       "12  本科及以上   经验不限          面议  2020年04月24日                桥涵设计工程师   南京-建邺区   \n",
       "13   统招本科   3-5年          面议  2020年04月23日  中新智地-党务文秘专员（中新集团下属公司）       苏州   \n",
       "14  硕士及以上  5-10年   8-14k·12薪  2020年04月23日        财务部 高级执行员/资深执行员       苏州   \n",
       "15  硕士及以上   3-5年   7-14k·18薪  2020年04月23日    招商部 执行员/高级执行员/资深执行员       苏州   \n",
       "16   统招本科  5-10年  18-22k·12薪  2020年04月23日          工程技术支持及能源管理经理   上海-静安区   \n",
       "17  大专及以上   1-3年   8-10k·13薪  2020年04月23日                  A培训讲师   杭州-滨江区   \n",
       "18  本科及以上  10年以上  25-35k·20薪  2020年04月23日                   财务总监   无锡-惠山区   \n",
       "19  大专及以上   3-5年  30-60k·12薪  2020年04月21日                  心理咨询师   上海-松江区   \n",
       "20  硕士及以上   经验不限          面议  2020年04月21日                   总裁秘书    杭州-宁围   \n",
       "21  本科及以上  5-10年  10-25k·12薪  2020年04月08日                   技术研发       青岛   \n",
       "22  大专及以上  5-10年  16-25k·12薪  2019年08月20日                 销售总监-3       上海   \n",
       "23   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       清远   \n",
       "24   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       长春   \n",
       "25   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       郑州   \n",
       "26   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       济南   \n",
       "27   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       潍坊   \n",
       "28   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监      石家庄   \n",
       "29   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监      秦皇岛   \n",
       "30   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       廊坊   \n",
       "31   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       重庆   \n",
       "32   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       武汉   \n",
       "33   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       南京   \n",
       "34   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       上海   \n",
       "35   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       大连   \n",
       "36   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       天津   \n",
       "37   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       北京   \n",
       "38   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       珠海   \n",
       "39   统招本科  10年以上  20-40k·12薪  2020年04月26日                 草坪养护总监       深圳   \n",
       "\n",
       "                   公司名称                                           链结  \\\n",
       "0              上海基分文化传播  https://www.liepin.com/job/1927770805.shtml   \n",
       "1               畅捷通支付北京  https://www.liepin.com/job/1927767527.shtml   \n",
       "2      京创智汇(上海)物流科技有限公司  https://www.liepin.com/job/1927765811.shtml   \n",
       "3          北京海纳世纪科技有限公司  https://www.liepin.com/job/1927760887.shtml   \n",
       "4                  泽金金服  https://www.liepin.com/job/1927746007.shtml   \n",
       "5                   百合网  https://www.liepin.com/job/1927726909.shtml   \n",
       "6                  创能科技  https://www.liepin.com/job/1927692139.shtml   \n",
       "7                  优网科技  https://www.liepin.com/job/1927690093.shtml   \n",
       "8                  盛拓传媒  https://www.liepin.com/job/1927688057.shtml   \n",
       "9                  慧科讯业  https://www.liepin.com/job/1927673039.shtml   \n",
       "10  湖南岳麓山数据科学与技术研究院有限公司  https://www.liepin.com/job/1927660815.shtml   \n",
       "11      佛山市启动成功智能科技有限公司  https://www.liepin.com/job/1927649765.shtml   \n",
       "12                  大搜车  https://www.liepin.com/job/1927615677.shtml   \n",
       "13                 大麦信息  https://www.liepin.com/job/1927615367.shtml   \n",
       "14       北京自如生活企业管理有限公司  https://www.liepin.com/job/1927570175.shtml   \n",
       "15                 橘子文化  https://www.liepin.com/job/1927470669.shtml   \n",
       "16                  百合网  https://www.liepin.com/job/1927468011.shtml   \n",
       "17         杭州大热电子商务有限公司  https://www.liepin.com/job/1927385183.shtml   \n",
       "18                  百合网  https://www.liepin.com/job/1927349661.shtml   \n",
       "19           郑州珑凌科技有限公司  https://www.liepin.com/job/1927310141.shtml   \n",
       "20                 创能科技  https://www.liepin.com/job/1927297737.shtml   \n",
       "21       深圳瀚德金融科技控股有限公司  https://www.liepin.com/job/1927265957.shtml   \n",
       "22        广州瀚翼扬电子商务有限公司  https://www.liepin.com/job/1927163671.shtml   \n",
       "23         北京海纳世纪科技有限公司  https://www.liepin.com/job/1927036409.shtml   \n",
       "24         华硕电脑（上海）有限公司  https://www.liepin.com/job/1926477641.shtml   \n",
       "25                 酷划在线  https://www.liepin.com/job/1926294067.shtml   \n",
       "26  国汽(北京)智能网联汽车研究院有限公司  https://www.liepin.com/job/1926037471.shtml   \n",
       "27         华硕电脑（上海）有限公司  https://www.liepin.com/job/1925975821.shtml   \n",
       "28                  优趣汇  https://www.liepin.com/job/1925936685.shtml   \n",
       "29                  百合网  https://www.liepin.com/job/1925055847.shtml   \n",
       "..                  ...                                          ...   \n",
       "10   广西来宾国有资本投资运营集团有限公司  https://www.liepin.com/job/1924092973.shtml   \n",
       "11   广西来宾国有资本投资运营集团有限公司  https://www.liepin.com/job/1919733241.shtml   \n",
       "12                  苏交科  https://www.liepin.com/job/1927540495.shtml   \n",
       "13   中新苏州工业园区开发集团股份有限公司  https://www.liepin.com/job/1927695151.shtml   \n",
       "14   中新苏州工业园区开发集团股份有限公司  https://www.liepin.com/job/1927687865.shtml   \n",
       "15   中新苏州工业园区开发集团股份有限公司  https://www.liepin.com/job/1927687613.shtml   \n",
       "16                  爱玛客  https://www.liepin.com/job/1926893265.shtml   \n",
       "17         上海比户环保科技有限公司  https://www.liepin.com/job/1925924485.shtml   \n",
       "18        江苏菲沃泰纳米科技有限公司  https://www.liepin.com/job/1915792154.shtml   \n",
       "19         上海戒成健康咨询有限公司  https://www.liepin.com/job/1927202691.shtml   \n",
       "20           博地控股集团有限公司  https://www.liepin.com/job/1922648561.shtml   \n",
       "21         青岛科博制冷设备有限公司  https://www.liepin.com/job/1923230537.shtml   \n",
       "22         上海星月投资管理有限公司  https://www.liepin.com/job/1922712939.shtml   \n",
       "23                 恒大集团  https://www.liepin.com/job/1927772103.shtml   \n",
       "24                 恒大集团  https://www.liepin.com/job/1927772101.shtml   \n",
       "25                 恒大集团  https://www.liepin.com/job/1927772099.shtml   \n",
       "26                 恒大集团  https://www.liepin.com/job/1927772097.shtml   \n",
       "27                 恒大集团  https://www.liepin.com/job/1927772095.shtml   \n",
       "28                 恒大集团  https://www.liepin.com/job/1927772093.shtml   \n",
       "29                 恒大集团  https://www.liepin.com/job/1927772091.shtml   \n",
       "30                 恒大集团  https://www.liepin.com/job/1927772089.shtml   \n",
       "31                 恒大集团  https://www.liepin.com/job/1927772087.shtml   \n",
       "32                 恒大集团  https://www.liepin.com/job/1927772085.shtml   \n",
       "33                 恒大集团  https://www.liepin.com/job/1927772083.shtml   \n",
       "34                 恒大集团  https://www.liepin.com/job/1927772081.shtml   \n",
       "35                 恒大集团  https://www.liepin.com/job/1927772079.shtml   \n",
       "36                 恒大集团  https://www.liepin.com/job/1927772077.shtml   \n",
       "37                 恒大集团  https://www.liepin.com/job/1927772075.shtml   \n",
       "38                 恒大集团  https://www.liepin.com/job/1927772073.shtml   \n",
       "39                 恒大集团  https://www.liepin.com/job/1927772071.shtml   \n",
       "\n",
       "                                       公司URL  热门行业分类  \n",
       "0    https://www.liepin.com/company/8895584/  互联网/电商  \n",
       "1    https://www.liepin.com/company/8577672/  互联网/电商  \n",
       "2   https://www.liepin.com/company/10054581/  互联网/电商  \n",
       "3    https://www.liepin.com/company/9215228/  互联网/电商  \n",
       "4    https://www.liepin.com/company/8787574/  互联网/电商  \n",
       "5   https://www.liepin.com/company/10077527/  互联网/电商  \n",
       "6    https://www.liepin.com/company/7992349/  互联网/电商  \n",
       "7    https://www.liepin.com/company/7896274/  互联网/电商  \n",
       "8    https://www.liepin.com/company/8597194/  互联网/电商  \n",
       "9    https://www.liepin.com/company/1199797/  互联网/电商  \n",
       "10  https://www.liepin.com/company/10184205/  互联网/电商  \n",
       "11   https://www.liepin.com/company/9762201/  互联网/电商  \n",
       "12   https://www.liepin.com/company/8141158/  互联网/电商  \n",
       "13   https://www.liepin.com/company/7870705/  互联网/电商  \n",
       "14   https://www.liepin.com/company/8916470/  互联网/电商  \n",
       "15   https://www.liepin.com/company/8310595/  互联网/电商  \n",
       "16  https://www.liepin.com/company/10077527/  互联网/电商  \n",
       "17   https://www.liepin.com/company/9857093/  互联网/电商  \n",
       "18  https://www.liepin.com/company/10077527/  互联网/电商  \n",
       "19   https://www.liepin.com/company/8113931/  互联网/电商  \n",
       "20   https://www.liepin.com/company/7992349/  互联网/电商  \n",
       "21   https://www.liepin.com/company/9138140/  互联网/电商  \n",
       "22   https://www.liepin.com/company/8881741/  互联网/电商  \n",
       "23   https://www.liepin.com/company/9215228/  互联网/电商  \n",
       "24   https://www.liepin.com/company/8134688/  互联网/电商  \n",
       "25   https://www.liepin.com/company/7967239/  互联网/电商  \n",
       "26   https://www.liepin.com/company/9532936/  互联网/电商  \n",
       "27   https://www.liepin.com/company/8134688/  互联网/电商  \n",
       "28   https://www.liepin.com/company/8453342/  互联网/电商  \n",
       "29  https://www.liepin.com/company/10077527/  互联网/电商  \n",
       "..                                       ...     ...  \n",
       "10  https://www.liepin.com/company/10029116/    其他行业  \n",
       "11  https://www.liepin.com/company/10029116/    其他行业  \n",
       "12   https://www.liepin.com/company/8445465/    其他行业  \n",
       "13   https://www.liepin.com/company/8096825/    其他行业  \n",
       "14   https://www.liepin.com/company/8096825/    其他行业  \n",
       "15   https://www.liepin.com/company/8096825/    其他行业  \n",
       "16    https://www.liepin.com/company/941363/    其他行业  \n",
       "17   https://www.liepin.com/company/9728295/    其他行业  \n",
       "18   https://www.liepin.com/company/9318072/    其他行业  \n",
       "19  https://www.liepin.com/company/12193883/    其他行业  \n",
       "20  https://www.liepin.com/company/10041535/    其他行业  \n",
       "21   https://www.liepin.com/company/9905465/    其他行业  \n",
       "22   https://www.liepin.com/company/9627932/    其他行业  \n",
       "23    https://www.liepin.com/company/850378/    其他行业  \n",
       "24    https://www.liepin.com/company/850378/    其他行业  \n",
       "25    https://www.liepin.com/company/850378/    其他行业  \n",
       "26    https://www.liepin.com/company/850378/    其他行业  \n",
       "27    https://www.liepin.com/company/850378/    其他行业  \n",
       "28    https://www.liepin.com/company/850378/    其他行业  \n",
       "29    https://www.liepin.com/company/850378/    其他行业  \n",
       "30    https://www.liepin.com/company/850378/    其他行业  \n",
       "31    https://www.liepin.com/company/850378/    其他行业  \n",
       "32    https://www.liepin.com/company/850378/    其他行业  \n",
       "33    https://www.liepin.com/company/850378/    其他行业  \n",
       "34    https://www.liepin.com/company/850378/    其他行业  \n",
       "35    https://www.liepin.com/company/850378/    其他行业  \n",
       "36    https://www.liepin.com/company/850378/    其他行业  \n",
       "37    https://www.liepin.com/company/850378/    其他行业  \n",
       "38    https://www.liepin.com/company/850378/    其他行业  \n",
       "39    https://www.liepin.com/company/850378/    其他行业  \n",
       "\n",
       "[2040 rows x 10 columns]"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Crawl the search results once per industry and merge them into one table.\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "\n",
    "# `参数_industries_用户体验` maps an industry label (k) to the payload (v) that is\n",
    "# handed to `requests_liepin`; both names are defined in earlier cells.\n",
    "list_df = list()\n",
    "for k, v in 参数_industries_用户体验.items():\n",
    "    payload = v\n",
    "    df = requests_liepin(url, params=payload)\n",
    "    # Tag every row with the industry label it was fetched for.\n",
    "    df = df.assign(热门行业分类=k)\n",
    "    list_df.append(df)\n",
    "\n",
    "# ignore_index=True gives the merged frame a single unique 0..N-1 index.\n",
    "# Without it each per-industry frame keeps its own row labels, so the same\n",
    "# labels repeat throughout `df_all` and label-based lookups become ambiguous.\n",
    "df_all = pd.concat(list_df, ignore_index=True)\n",
    "df_all"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [],
   "source": [
    "# C-4  Export: write the merged industry results to an Excel workbook.\n",
    "df_all.to_excel(\n",
    "    excel_writer=\"行业类型的数据爬取.xlsx\",\n",
    "    sheet_name=\"搜查结果\",\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 爬取城市数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'全国': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '北京': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=010&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '上海': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=020&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '广州': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=050020&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '深圳': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=050090&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '天津': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=030&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '苏州': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=060080&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '重庆': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=040&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '南京': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=060020&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '杭州': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=070020&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '大连': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=210040&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '成都': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=280020&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '武汉': '/zhaopin/?init=-1&headckid=626dafaeb873247b&flushckid=1&fromSearchBtn=2&dqs=170020&keyword=%E9%94%80%E5%94%AE&ckid=626dafaeb873247b&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=4868162b76df5d62239cc742803b716c&d_curPage=0&d_pageSize=40&d_headId=4868162b76df5d62239cc742803b716c',\n",
       " '其他': 'javascript:;'}"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Scrape the city filter row: collect each option's label and its link.\n",
    "import pandas as pd\n",
    "from requests_html import HTMLSession\n",
    "\n",
    "session = HTMLSession()\n",
    "url = \"https://www.liepin.com/zhaopin/?keyword=销售\"\n",
    "r = session.get(url)\n",
    "\n",
    "# Resolve the filter panel and then the <dd> at index 2 of the ones that follow\n",
    "# a filter title; this notebook treats that entry as the city row.\n",
    "conditions_box = r.html.xpath('//div[@data-selector=\"search-conditions\"]')[0]\n",
    "city_dd = conditions_box.xpath('//dt[@class=\"search-title\"]/following-sibling::dd')[2]\n",
    "\n",
    "# Hrefs and link texts are extracted separately and paired up by position.\n",
    "城市链接 = city_dd.xpath('//a/@href')\n",
    "城市文本 = city_dd.xpath('//a/text()')\n",
    "\n",
    "城市数据选择器链结 = {文本: 链接 for 文本, 链接 in zip(城市文本, 城市链接)}\n",
    "城市数据选择器链结"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'pandas.core.frame.DataFrame'>\n",
      "RangeIndex: 14 entries, 0 to 13\n",
      "Data columns (total 6 columns):\n",
      "scheme      14 non-null object\n",
      "netloc      14 non-null object\n",
      "path        14 non-null object\n",
      "params      14 non-null object\n",
      "query       14 non-null object\n",
      "fragment    14 non-null object\n",
      "dtypes: object(6)\n",
      "memory usage: 752.0+ bytes\n",
      "scheme       2\n",
      "netloc       1\n",
      "path         2\n",
      "params       1\n",
      "query       14\n",
      "fragment     1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>scheme</th>\n",
       "      <th>netloc</th>\n",
       "      <th>path</th>\n",
       "      <th>params</th>\n",
       "      <th>query</th>\n",
       "      <th>fragment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=626dafaeb873247b&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=626dafaeb873247b&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=626dafaeb873247b&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=626dafaeb873247b&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;headckid=626dafaeb873247b&amp;flushckid=1&amp;...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  scheme netloc       path params  \\\n",
       "0                /zhaopin/          \n",
       "1                /zhaopin/          \n",
       "2                /zhaopin/          \n",
       "3                /zhaopin/          \n",
       "4                /zhaopin/          \n",
       "\n",
       "                                               query fragment  \n",
       "0  init=-1&headckid=626dafaeb873247b&flushckid=1&...           \n",
       "1  init=-1&headckid=626dafaeb873247b&flushckid=1&...           \n",
       "2  init=-1&headckid=626dafaeb873247b&flushckid=1&...           \n",
       "3  init=-1&headckid=626dafaeb873247b&flushckid=1&...           \n",
       "4  init=-1&headckid=626dafaeb873247b&flushckid=1&...           "
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Parse the URLs: split every city link into its components, one row per link.\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "\n",
    "parsed_links = [urlparse(link) for link in 城市数据选择器链结.values()]\n",
    "df = pd.DataFrame(parsed_links)\n",
    "\n",
    "df.info()\n",
    "# Distinct-value counts per component show which parts differ between links.\n",
    "print(df.nunique())\n",
    "df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "ckid              1\n",
      "d_ckId            1\n",
      "d_curPage         1\n",
      "d_headId          1\n",
      "d_pageSize        1\n",
      "d_sfrom           1\n",
      "dqs              12\n",
      "flushckid         1\n",
      "fromSearchBtn     1\n",
      "headckid          1\n",
      "init              1\n",
      "keyword           1\n",
      "siTag             1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>ckid</th>\n",
       "      <th>d_ckId</th>\n",
       "      <th>d_curPage</th>\n",
       "      <th>d_headId</th>\n",
       "      <th>d_pageSize</th>\n",
       "      <th>d_sfrom</th>\n",
       "      <th>dqs</th>\n",
       "      <th>flushckid</th>\n",
       "      <th>fromSearchBtn</th>\n",
       "      <th>headckid</th>\n",
       "      <th>init</th>\n",
       "      <th>keyword</th>\n",
       "      <th>siTag</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>010</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>020</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>050020</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>050090</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>030</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>060080</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>040</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>060020</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>070020</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>210040</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>0</td>\n",
       "      <td>4868162b76df5d62239cc742803b716c</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>280020</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>626dafaeb873247b</td>\n",
       "      <td>-1</td>\n",
       "      <td>销售</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                ckid                            d_ckId d_curPage  \\\n",
       "0   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "1   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "2   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "3   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "4   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "5   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "6   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "7   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "8   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "9   626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "10  626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "11  626dafaeb873247b  4868162b76df5d62239cc742803b716c         0   \n",
       "\n",
       "                            d_headId d_pageSize         d_sfrom     dqs  \\\n",
       "0   4868162b76df5d62239cc742803b716c         40  search_unknown     NaN   \n",
       "1   4868162b76df5d62239cc742803b716c         40  search_unknown     010   \n",
       "2   4868162b76df5d62239cc742803b716c         40  search_unknown     020   \n",
       "3   4868162b76df5d62239cc742803b716c         40  search_unknown  050020   \n",
       "4   4868162b76df5d62239cc742803b716c         40  search_unknown  050090   \n",
       "5   4868162b76df5d62239cc742803b716c         40  search_unknown     030   \n",
       "6   4868162b76df5d62239cc742803b716c         40  search_unknown  060080   \n",
       "7   4868162b76df5d62239cc742803b716c         40  search_unknown     040   \n",
       "8   4868162b76df5d62239cc742803b716c         40  search_unknown  060020   \n",
       "9   4868162b76df5d62239cc742803b716c         40  search_unknown  070020   \n",
       "10  4868162b76df5d62239cc742803b716c         40  search_unknown  210040   \n",
       "11  4868162b76df5d62239cc742803b716c         40  search_unknown  280020   \n",
       "\n",
       "   flushckid fromSearchBtn          headckid init keyword  \\\n",
       "0          1             2  626dafaeb873247b   -1      销售   \n",
       "1          1             2  626dafaeb873247b   -1      销售   \n",
       "2          1             2  626dafaeb873247b   -1      销售   \n",
       "3          1             2  626dafaeb873247b   -1      销售   \n",
       "4          1             2  626dafaeb873247b   -1      销售   \n",
       "5          1             2  626dafaeb873247b   -1      销售   \n",
       "6          1             2  626dafaeb873247b   -1      销售   \n",
       "7          1             2  626dafaeb873247b   -1      销售   \n",
       "8          1             2  626dafaeb873247b   -1      销售   \n",
       "9          1             2  626dafaeb873247b   -1      销售   \n",
       "10         1             2  626dafaeb873247b   -1      销售   \n",
       "11         1             2  626dafaeb873247b   -1      销售   \n",
       "\n",
       "                                            siTag  \n",
       "0   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "1   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "2   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "3   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "4   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "5   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "6   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "7   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "8   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "9   1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "10  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "11  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  "
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# B-3 针对query 再解析之 \n",
    "#df_qs = pd.DataFrame([ parse_qs(x) for x in df['query'] ])\n",
    "df_qs = pd.DataFrame([{k:v[0] for k,v in parse_qs(x).items()} for x in df['query'] ])\n",
    "print (df_qs.nunique())\n",
    "df_qs.head(12)\n",
    "# df_qs[['keyword','industries']]  取表格中特定的某个值"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>keyword</th>\n",
       "      <th>dqs</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>销售</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>销售</td>\n",
       "      <td>010</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>销售</td>\n",
       "      <td>020</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>销售</td>\n",
       "      <td>050020</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>销售</td>\n",
       "      <td>050090</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>销售</td>\n",
       "      <td>030</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>销售</td>\n",
       "      <td>060080</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>销售</td>\n",
       "      <td>040</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>销售</td>\n",
       "      <td>060020</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>销售</td>\n",
       "      <td>070020</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>销售</td>\n",
       "      <td>210040</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>销售</td>\n",
       "      <td>280020</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>销售</td>\n",
       "      <td>170020</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   keyword     dqs\n",
       "0       销售     NaN\n",
       "1       销售     010\n",
       "2       销售     020\n",
       "3       销售  050020\n",
       "4       销售  050090\n",
       "5       销售     030\n",
       "6       销售  060080\n",
       "7       销售     040\n",
       "8       销售  060020\n",
       "9       销售  070020\n",
       "10      销售  210040\n",
       "11      销售  280020\n",
       "12      销售  170020\n",
       "13     NaN     NaN"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_qs[['keyword','dqs']] #取表格中特定的某个值"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 爬取薪资数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'10-15万': '/zhaopin/?init=-1&salary=10$15&ckid=efd12b7a4c45b51d&headckid=efd12b7a4c45b51d&flushckid=1&fromSearchBtn=2&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f54d8a69399c8673c64d9dbb3dc3d13e&d_curPage=0&d_pageSize=40&d_headId=f54d8a69399c8673c64d9dbb3dc3d13e',\n",
       " '15-20万': '/zhaopin/?init=-1&salary=15$20&ckid=efd12b7a4c45b51d&headckid=efd12b7a4c45b51d&flushckid=1&fromSearchBtn=2&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f54d8a69399c8673c64d9dbb3dc3d13e&d_curPage=0&d_pageSize=40&d_headId=f54d8a69399c8673c64d9dbb3dc3d13e',\n",
       " '20-30万': '/zhaopin/?init=-1&salary=20$30&ckid=efd12b7a4c45b51d&headckid=efd12b7a4c45b51d&flushckid=1&fromSearchBtn=2&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f54d8a69399c8673c64d9dbb3dc3d13e&d_curPage=0&d_pageSize=40&d_headId=f54d8a69399c8673c64d9dbb3dc3d13e',\n",
       " '30-50万': '/zhaopin/?init=-1&salary=30$50&ckid=efd12b7a4c45b51d&headckid=efd12b7a4c45b51d&flushckid=1&fromSearchBtn=2&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f54d8a69399c8673c64d9dbb3dc3d13e&d_curPage=0&d_pageSize=40&d_headId=f54d8a69399c8673c64d9dbb3dc3d13e',\n",
       " '50-100万': '/zhaopin/?init=-1&salary=50$100&ckid=efd12b7a4c45b51d&headckid=efd12b7a4c45b51d&flushckid=1&fromSearchBtn=2&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f54d8a69399c8673c64d9dbb3dc3d13e&d_curPage=0&d_pageSize=40&d_headId=f54d8a69399c8673c64d9dbb3dc3d13e',\n",
       " '100万以上': '/zhaopin/?init=-1&salary=100$999&ckid=efd12b7a4c45b51d&headckid=efd12b7a4c45b51d&flushckid=1&fromSearchBtn=2&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f54d8a69399c8673c64d9dbb3dc3d13e&d_curPage=0&d_pageSize=40&d_headId=f54d8a69399c8673c64d9dbb3dc3d13e'}"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import pandas as pd\n",
    "from requests_html import HTMLSession\n",
    "\n",
    "url = \"https://www.liepin.com/zhaopin?\"\n",
    "session = HTMLSession()\n",
    "r = session.get( url )\n",
    "\n",
    "薪资数据选择器链结 = r.html.xpath('//div[@data-selector=\"search-conditions\"]')[0] \\\n",
    "                    .xpath('//dt[@class=\"search-title\"]/following-sibling::dd')[3] \\\n",
    "                    .xpath('//dd[contains(@data-param,\"salary\")]/a')\n",
    "薪资数据选择器链结\n",
    "\n",
    "薪资数据选择器链结 = { x.xpath(\"a/text()\")[0]:x.xpath(\"a/@href\")[0] for x in 薪资数据选择器链结}\n",
    "薪资数据选择器链结"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'pandas.core.frame.DataFrame'>\n",
      "RangeIndex: 6 entries, 0 to 5\n",
      "Data columns (total 6 columns):\n",
      "scheme      6 non-null object\n",
      "netloc      6 non-null object\n",
      "path        6 non-null object\n",
      "params      6 non-null object\n",
      "query       6 non-null object\n",
      "fragment    6 non-null object\n",
      "dtypes: object(6)\n",
      "memory usage: 368.0+ bytes\n",
      "scheme      1\n",
      "netloc      1\n",
      "path        1\n",
      "params      1\n",
      "query       6\n",
      "fragment    1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>scheme</th>\n",
       "      <th>netloc</th>\n",
       "      <th>path</th>\n",
       "      <th>params</th>\n",
       "      <th>query</th>\n",
       "      <th>fragment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;salary=10$15&amp;ckid=efd12b7a4c45b51d&amp;hea...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;salary=15$20&amp;ckid=efd12b7a4c45b51d&amp;hea...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;salary=20$30&amp;ckid=efd12b7a4c45b51d&amp;hea...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;salary=30$50&amp;ckid=efd12b7a4c45b51d&amp;hea...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>init=-1&amp;salary=50$100&amp;ckid=efd12b7a4c45b51d&amp;he...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  scheme netloc       path params  \\\n",
       "0                /zhaopin/          \n",
       "1                /zhaopin/          \n",
       "2                /zhaopin/          \n",
       "3                /zhaopin/          \n",
       "4                /zhaopin/          \n",
       "\n",
       "                                               query fragment  \n",
       "0  init=-1&salary=10$15&ckid=efd12b7a4c45b51d&hea...           \n",
       "1  init=-1&salary=15$20&ckid=efd12b7a4c45b51d&hea...           \n",
       "2  init=-1&salary=20$30&ckid=efd12b7a4c45b51d&hea...           \n",
       "3  init=-1&salary=30$50&ckid=efd12b7a4c45b51d&hea...           \n",
       "4  init=-1&salary=50$100&ckid=efd12b7a4c45b51d&he...           "
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 解析url\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "\n",
    "df = pd.DataFrame([ urlparse(x) for x in 薪资数据选择器链结.values()])\n",
    "df.info()\n",
    "print(df.nunique())\n",
    "df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "ckid             1\n",
      "d_ckId           1\n",
      "d_curPage        1\n",
      "d_headId         1\n",
      "d_pageSize       1\n",
      "d_sfrom          1\n",
      "flushckid        1\n",
      "fromSearchBtn    1\n",
      "headckid         1\n",
      "init             1\n",
      "salary           6\n",
      "siTag            1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>ckid</th>\n",
       "      <th>d_ckId</th>\n",
       "      <th>d_curPage</th>\n",
       "      <th>d_headId</th>\n",
       "      <th>d_pageSize</th>\n",
       "      <th>d_sfrom</th>\n",
       "      <th>flushckid</th>\n",
       "      <th>fromSearchBtn</th>\n",
       "      <th>headckid</th>\n",
       "      <th>init</th>\n",
       "      <th>salary</th>\n",
       "      <th>siTag</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>0</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>-1</td>\n",
       "      <td>10$15</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>0</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>-1</td>\n",
       "      <td>15$20</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>0</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>-1</td>\n",
       "      <td>20$30</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>0</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>-1</td>\n",
       "      <td>30$50</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>0</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>-1</td>\n",
       "      <td>50$100</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>0</td>\n",
       "      <td>f54d8a69399c8673c64d9dbb3dc3d13e</td>\n",
       "      <td>40</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>efd12b7a4c45b51d</td>\n",
       "      <td>-1</td>\n",
       "      <td>100$999</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "               ckid                            d_ckId d_curPage  \\\n",
       "0  efd12b7a4c45b51d  f54d8a69399c8673c64d9dbb3dc3d13e         0   \n",
       "1  efd12b7a4c45b51d  f54d8a69399c8673c64d9dbb3dc3d13e         0   \n",
       "2  efd12b7a4c45b51d  f54d8a69399c8673c64d9dbb3dc3d13e         0   \n",
       "3  efd12b7a4c45b51d  f54d8a69399c8673c64d9dbb3dc3d13e         0   \n",
       "4  efd12b7a4c45b51d  f54d8a69399c8673c64d9dbb3dc3d13e         0   \n",
       "5  efd12b7a4c45b51d  f54d8a69399c8673c64d9dbb3dc3d13e         0   \n",
       "\n",
       "                           d_headId d_pageSize         d_sfrom flushckid  \\\n",
       "0  f54d8a69399c8673c64d9dbb3dc3d13e         40  search_unknown         1   \n",
       "1  f54d8a69399c8673c64d9dbb3dc3d13e         40  search_unknown         1   \n",
       "2  f54d8a69399c8673c64d9dbb3dc3d13e         40  search_unknown         1   \n",
       "3  f54d8a69399c8673c64d9dbb3dc3d13e         40  search_unknown         1   \n",
       "4  f54d8a69399c8673c64d9dbb3dc3d13e         40  search_unknown         1   \n",
       "5  f54d8a69399c8673c64d9dbb3dc3d13e         40  search_unknown         1   \n",
       "\n",
       "  fromSearchBtn          headckid init   salary  \\\n",
       "0             2  efd12b7a4c45b51d   -1    10$15   \n",
       "1             2  efd12b7a4c45b51d   -1    15$20   \n",
       "2             2  efd12b7a4c45b51d   -1    20$30   \n",
       "3             2  efd12b7a4c45b51d   -1    30$50   \n",
       "4             2  efd12b7a4c45b51d   -1   50$100   \n",
       "5             2  efd12b7a4c45b51d   -1  100$999   \n",
       "\n",
       "                                           siTag  \n",
       "0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "1  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "2  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "3  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "4  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  \n",
       "5  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw  "
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# B-3 针对query 再解析之 \n",
    "#df_qs = pd.DataFrame([ parse_qs(x) for x in df['query'] ])\n",
    "df_qs = pd.DataFrame([{k:v[0] for k,v in parse_qs(x).items()} for x in df['query'] ])\n",
    "print (df_qs.nunique())\n",
    "df_qs.head(12)\n",
    "# df_qs[['keyword','industries']]  取表格中特定的某个值"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'init': ['-1'], 'salary': ['10$15'], 'ckid': ['efd12b7a4c45b51d'], 'headckid': ['efd12b7a4c45b51d'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['f54d8a69399c8673c64d9dbb3dc3d13e']}\n",
      "{'10-15万': '10$15', '15-20万': '15$20', '20-30万': '20$30', '30-50万': '30$50', '50-100万': '50$100', '100万以上': '100$999'}\n"
     ]
    }
   ],
   "source": [
    "# 建构 参数模板 及 字典_salary\n",
    "def parse_url_qs_for_salary (url):\n",
    "    six_parts = urlparse(url) \n",
    "    out = parse_qs(six_parts.query)\n",
    "    return (out)\n",
    "\n",
    "# parse_url_qs_for_compTag(list(公司数据选择器链结.values())[0])['compTag']\n",
    "参数模板 = parse_url_qs_for_salary(list(薪资数据选择器链结.values())[0])\n",
    "print(参数模板)\n",
    "# [ parse_url_qs_for_compTag(x)['compTag'] for x in 公司数据选择器链结.values()]\n",
    "[ parse_url_qs_for_salary(x)['salary'][0] for x in 薪资数据选择器链结.values()]\n",
    "\n",
    "字典_salary = { k:parse_url_qs_for_salary(v)['salary'][0] for k,v in 薪资数据选择器链结.items()}\n",
    "print(字典_salary)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'10-15万': {'init': ['-1'], 'salary': ['10$15'], 'ckid': ['efd12b7a4c45b51d'], 'headckid': ['efd12b7a4c45b51d'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'keyword': ['用户体验']}, '15-20万': {'init': ['-1'], 'salary': ['15$20'], 'ckid': ['efd12b7a4c45b51d'], 'headckid': ['efd12b7a4c45b51d'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'keyword': ['用户体验']}, '20-30万': {'init': ['-1'], 'salary': ['20$30'], 'ckid': ['efd12b7a4c45b51d'], 'headckid': ['efd12b7a4c45b51d'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'keyword': ['用户体验']}, '30-50万': {'init': ['-1'], 'salary': ['30$50'], 'ckid': ['efd12b7a4c45b51d'], 'headckid': ['efd12b7a4c45b51d'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'keyword': ['用户体验']}, '50-100万': {'init': ['-1'], 'salary': ['50$100'], 'ckid': ['efd12b7a4c45b51d'], 'headckid': ['efd12b7a4c45b51d'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': 
['f54d8a69399c8673c64d9dbb3dc3d13e'], 'keyword': ['用户体验']}, '100万以上': {'init': ['-1'], 'salary': ['100$999'], 'ckid': ['efd12b7a4c45b51d'], 'headckid': ['efd12b7a4c45b51d'], 'flushckid': ['1'], 'fromSearchBtn': ['2'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['f54d8a69399c8673c64d9dbb3dc3d13e'], 'keyword': ['用户体验']}}\n"
     ]
    }
   ],
   "source": [
    "# 生成城市参数模板  \n",
    "def 参数模板生成(salary , keyword ):\n",
    "    参数 = 参数模板.copy()  # 复制一份参数模版\n",
    "    参数['salary'] = salary\n",
    "    参数['keyword'] = keyword\n",
    "    return (参数)\n",
    "\n",
    "# 赋值：keyword\n",
    "参数_salary_用户体验 = { k:参数模板生成(salary = [v], keyword = ['用户体验']) for k,v in 字典_salary.items()}\n",
    "print(参数_salary_用户体验)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [],
   "source": [
    "# HTTP session used by requests_liepin() below to issue its GET request\n",
    "session = HTMLSession()\n",
    "\n",
    "def requests_liepin(url, params):\n",
    "    \"\"\"Fetch one liepin search page and tabulate its job cards.\n",
    "\n",
    "    Args:\n",
    "        url: Address of the search page to request.\n",
    "        params: Query-string parameters forwarded to ``session.get``.\n",
    "\n",
    "    Returns:\n",
    "        A pandas DataFrame with one row per ``<li>`` under ``ul.sojob-list``\n",
    "        and one column per key of ``dict_xpaths``.\n",
    "    \"\"\"\n",
    "    # Use the caller's `params`. The previous code passed an unrelated global\n",
    "    # named `payload`, so this argument was silently ignored.\n",
    "    r = session.get(url, params=params)\n",
    "\n",
    "    # Select the job cards first, then query only inside each card.\n",
    "    主要元素 = r.html.xpath('//ul[@class=\"sojob-list\"]/li')\n",
    "\n",
    "    # Column name -> XPath, grouped by how the value is pulled out of a card.\n",
    "    dict_xpaths = {\n",
    "        'text': {\n",
    "            'edu': '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]',\n",
    "            '经验': '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]/following-sibling::span',\n",
    "            '薪水': '//div[contains(@class,\"job-info\")]/p/span[@class=\"text-warning\"]',\n",
    "            '时间': '//div[contains(@class,\"job-info\")]/p/time/@title',\n",
    "            '职称': '//div[contains(@class,\"job-info\")]/h3/a',\n",
    "            '行业': '//div[contains(@class,\"job-info\")]/p/a',\n",
    "            '公司名称': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a',\n",
    "        },\n",
    "        'text_content': {\n",
    "        },\n",
    "        'href': {\n",
    "            '链结': '//div[contains(@class,\"job-info\")]/h3/a',\n",
    "            '公司URL': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a',\n",
    "        }\n",
    "    }\n",
    "\n",
    "    def get_e_text_content(_xpath_):\n",
    "        \"\"\"Text content of the first match in each card ('' when nothing matches).\"\"\"\n",
    "        暂存结果 = []\n",
    "        for e in 主要元素:\n",
    "            命中 = e.xpath(_xpath_)\n",
    "            # An empty string keeps every column the same length as 主要元素.\n",
    "            暂存结果.append(命中[0].lxml.text_content() if 命中 else \"\")\n",
    "        return 暂存结果\n",
    "\n",
    "    def get_e_text(_xpath_):\n",
    "        \"\"\"Stripped text of every match in each card, joined into one string.\"\"\"\n",
    "        # Attribute XPaths (e.g. .../@title) yield plain strings; element XPaths yield elements.\n",
    "        return [\n",
    "            \"\".join(x.strip() if isinstance(x, str) else x.text.strip() for x in e.xpath(_xpath_))\n",
    "            for e in 主要元素\n",
    "        ]\n",
    "\n",
    "    def get_e_href(_xpath_):\n",
    "        \"\"\"One absolute link of the first match in each card ('' when there is none).\"\"\"\n",
    "        暂存结果 = []\n",
    "        for e in 主要元素:\n",
    "            命中 = e.xpath(_xpath_, first=True)\n",
    "            # `first=True` gives None when the card has no such node; treat that as no link.\n",
    "            链接 = list(命中.absolute_links) if 命中 is not None else []\n",
    "            暂存结果.append(链接[0] if 链接 else \"\")\n",
    "        return 暂存结果\n",
    "\n",
    "    # Run every XPath against the cards only; columns follow the group order below.\n",
    "    数据字典 = {k: get_e_text_content(v) for k, v in dict_xpaths['text_content'].items()}\n",
    "    数据字典.update({k: get_e_text(v) for k, v in dict_xpaths['text'].items()})\n",
    "    数据字典.update({k: get_e_href(v) for k, v in dict_xpaths['href'].items()})\n",
    "\n",
    "    数据 = pd.DataFrame(数据字典)\n",
    "    # Optional export: 数据.to_excel(\"20春_Web数据挖掘_week03_liepin.xlsx\", sheet_name=\"搜查结果\")\n",
    "    return 数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>edu</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>时间</th>\n",
       "      <th>职称</th>\n",
       "      <th>行业</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>链结</th>\n",
       "      <th>公司URL</th>\n",
       "      <th>薪资水平</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>7-10k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>市场经理</td>\n",
       "      <td>深圳-宝安区</td>\n",
       "      <td>深圳市耀美环保有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927771863.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9234847/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>9-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>薪酬绩效主管</td>\n",
       "      <td>上海</td>\n",
       "      <td>中翔金属(上海)有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927771369.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9454064/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>数据库工程师 DBA</td>\n",
       "      <td>上海-曲阳</td>\n",
       "      <td>MDC Telecom</td>\n",
       "      <td>https://www.liepin.com/job/1927770857.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8104849/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-13k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>课程顾问</td>\n",
       "      <td>北京</td>\n",
       "      <td>北京新得科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927770073.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9807335/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>网络安全工程师（网攻方向）</td>\n",
       "      <td></td>\n",
       "      <td>北京华油信通科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927769745.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8330229/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>审计总监</td>\n",
       "      <td>德州</td>\n",
       "      <td>泰山体育</td>\n",
       "      <td>https://www.liepin.com/job/1927769743.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7958679/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>海外售后技术支持经理（法语）/Overseas After Sales Technical ...</td>\n",
       "      <td>上海</td>\n",
       "      <td>爱驰汽车</td>\n",
       "      <td>https://www.liepin.com/job/1927769147.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9146383/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-20k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>咨询顾问</td>\n",
       "      <td>上海-青浦区</td>\n",
       "      <td>上海爱湃斯科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927767341.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10006015/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>8-12k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>质量PQE工程师</td>\n",
       "      <td>珠海-香洲区</td>\n",
       "      <td>英搏尔</td>\n",
       "      <td>https://www.liepin.com/job/1927766961.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9557666/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>8-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>质量PQE主管</td>\n",
       "      <td>珠海-香洲区</td>\n",
       "      <td>英搏尔</td>\n",
       "      <td>https://www.liepin.com/job/1927766881.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9557666/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>7-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>质量SQE工程师</td>\n",
       "      <td>珠海-香洲区</td>\n",
       "      <td>英搏尔</td>\n",
       "      <td>https://www.liepin.com/job/1927766799.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9557666/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>8-10k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>空运副经理/经理</td>\n",
       "      <td>西安-高新区</td>\n",
       "      <td>海得邦国际物流控股(集团)有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927766623.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10079421/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>8-10k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>综合主管</td>\n",
       "      <td>北京</td>\n",
       "      <td>亿达控股有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927766331.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2048766/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>学历不限</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>技术员，DMT&amp;MB实验室</td>\n",
       "      <td>上海-张江</td>\n",
       "      <td>罗氏制药</td>\n",
       "      <td>https://www.liepin.com/job/1927766269.shtml</td>\n",
       "      <td>https://www.liepin.com/company/916012/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>12-16k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>模具项目工程师</td>\n",
       "      <td></td>\n",
       "      <td>滁州市博康模具塑料有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927764739.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8593126/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>6-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>模具设计工程师（密封-新能源）</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>国机智能</td>\n",
       "      <td>https://www.liepin.com/job/1927749185.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8942684/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-20k·13薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>客服主管</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>泽金金服</td>\n",
       "      <td>https://www.liepin.com/job/1927746007.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8787574/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>6-8k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>财务收银</td>\n",
       "      <td>杭州-下城区</td>\n",
       "      <td>阳光城集团</td>\n",
       "      <td>https://www.liepin.com/job/1927744955.shtml</td>\n",
       "      <td>https://www.liepin.com/company/876734/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>学历不限</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>5-12k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>光电顾问</td>\n",
       "      <td>南京-江宁区</td>\n",
       "      <td>江苏灵美东方医院管理有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927739435.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10030447/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>6-10k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>总账会计</td>\n",
       "      <td>深圳-宝安区</td>\n",
       "      <td>HKC</td>\n",
       "      <td>https://www.liepin.com/job/1927733447.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8795947/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>10-18k·15薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>成本副经理/主管</td>\n",
       "      <td>广州-花都区</td>\n",
       "      <td>鸿利光电</td>\n",
       "      <td>https://www.liepin.com/job/1927727601.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2246346/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>店铺店长</td>\n",
       "      <td>上海-杨浦区</td>\n",
       "      <td>百合网</td>\n",
       "      <td>https://www.liepin.com/job/1927726909.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10077527/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>薪酬绩效专家</td>\n",
       "      <td>杭州</td>\n",
       "      <td>农夫山泉</td>\n",
       "      <td>https://www.liepin.com/job/1927726751.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2868477/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>新媒体运营/文案策划</td>\n",
       "      <td>上海-徐汇区</td>\n",
       "      <td>上海宜来卫浴有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927711449.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10082469/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>销售人力资源部总监</td>\n",
       "      <td>杭州</td>\n",
       "      <td>农夫山泉</td>\n",
       "      <td>https://www.liepin.com/job/1927710481.shtml</td>\n",
       "      <td>https://www.liepin.com/company/2868477/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>生产主管</td>\n",
       "      <td>上海-浦东新区</td>\n",
       "      <td>上海微创心通医疗科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927706945.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9494398/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>6-8k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>案场经理</td>\n",
       "      <td>荆门</td>\n",
       "      <td>浙江祥生物业服务有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927698187.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9115685/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>港口物流经理</td>\n",
       "      <td>扬州</td>\n",
       "      <td>君明实业集团有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927697843.shtml</td>\n",
       "      <td>https://www.liepin.com/company/12180625/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>7-12k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>java开发工程师</td>\n",
       "      <td>郑州</td>\n",
       "      <td>郑州格蒂电力智能科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927692971.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10095389/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>游戏特效</td>\n",
       "      <td>北京</td>\n",
       "      <td>北京涂鸦多得科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927691417.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7877511/</td>\n",
       "      <td>10-15万</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>储备学校总校长</td>\n",
       "      <td>长沙</td>\n",
       "      <td>上海中锐教育发展有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927771441.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10117087/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>储备学校总校长</td>\n",
       "      <td>苏州</td>\n",
       "      <td>上海中锐教育发展有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927771439.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10117087/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>储备学校总校长</td>\n",
       "      <td>上海</td>\n",
       "      <td>上海中锐教育发展有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927771437.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10117087/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>70-100k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>算法总监</td>\n",
       "      <td>北京</td>\n",
       "      <td>福佑卡车</td>\n",
       "      <td>https://www.liepin.com/job/1927770267.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10058353/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>50-80k·13薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>技术专家/技术总监</td>\n",
       "      <td>上海-张江</td>\n",
       "      <td>上海擎创信息技术有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927768823.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9173769/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>95-150k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>技术总监</td>\n",
       "      <td>成都</td>\n",
       "      <td>成都聚创伟业电子商务有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927768425.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9699967/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>智能谷负责人</td>\n",
       "      <td>上海-青浦区</td>\n",
       "      <td>上海爱仕达机器人有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927767777.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10172529/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>博士</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>Resin GM</td>\n",
       "      <td>上海</td>\n",
       "      <td>米高蒲志国际(香港)有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927767483.shtml</td>\n",
       "      <td>https://www.liepin.com/company/1790705/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>RA Senior Director - Asia</td>\n",
       "      <td>上海</td>\n",
       "      <td>米高蒲志国际(香港)有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927766255.shtml</td>\n",
       "      <td>https://www.liepin.com/company/1790705/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>70-100k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>交付经理</td>\n",
       "      <td>深圳-龙岗区</td>\n",
       "      <td>深南电路</td>\n",
       "      <td>https://www.liepin.com/job/1927764193.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8136258/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>70-100k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>通信系统工程师（专家级）</td>\n",
       "      <td></td>\n",
       "      <td>北京九天微星科技发展有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927763193.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9247111/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>100-130k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>首席运营官（COO）</td>\n",
       "      <td>珠海-迎宾</td>\n",
       "      <td>爱婴岛新零售管理有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927761455.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9090500/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>30-60k·18薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>腾讯云安全后台开发工程师</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>腾讯</td>\n",
       "      <td>https://www.liepin.com/job/1927760483.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7983148/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>30-60k·18薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>售后技术支持工程师</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>腾讯</td>\n",
       "      <td>https://www.liepin.com/job/1927760395.shtml</td>\n",
       "      <td>https://www.liepin.com/company/7983148/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>50-100k·12薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>大湾区事业部总监</td>\n",
       "      <td>深圳</td>\n",
       "      <td>中舍控股(深圳)有限责任公司</td>\n",
       "      <td>https://www.liepin.com/job/1927756871.shtml</td>\n",
       "      <td>https://www.liepin.com/company/12222055/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>阿里淘小铺掌柜（合伙人）</td>\n",
       "      <td>武汉-江汉区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927755049.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>长沙-芙蓉区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927755013.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>阿里淘小铺掌柜（合伙人）</td>\n",
       "      <td>广州-越秀区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927754935.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>语音算法总监</td>\n",
       "      <td>上海</td>\n",
       "      <td>竹间智能</td>\n",
       "      <td>https://www.liepin.com/job/1927740819.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8608119/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>50-70k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>项目总经理</td>\n",
       "      <td>深圳-罗湖区</td>\n",
       "      <td>深圳市东旭鸿基地产有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927734901.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9645744/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>南京-玄武区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731723.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>上海-黄浦区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731713.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td></td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731701.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>武汉-武昌区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731679.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>苏州-昆山</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731577.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>厦门-思明区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731555.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>50-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>绍兴-越城区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731551.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>杭州-拱墅区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731485.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>深圳-福田区</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731457.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>35-65k·16薪</td>\n",
       "      <td>2020年04月26日</td>\n",
       "      <td>淘小铺掌柜（合伙人）</td>\n",
       "      <td>广州-天河北</td>\n",
       "      <td>湖北古荆州酒业有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1927731439.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10020805/</td>\n",
       "      <td>100万以上</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>240 rows × 10 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      edu     经验            薪水           时间  \\\n",
       "0   大专及以上   3-5年     7-10k·12薪  2020年04月26日   \n",
       "1   大专及以上   1-3年     9-15k·12薪  2020年04月26日   \n",
       "2    统招本科   3-5年            面议  2020年04月26日   \n",
       "3   大专及以上   1-3年     8-13k·12薪  2020年04月26日   \n",
       "4    统招本科   1-3年            面议  2020年04月26日   \n",
       "5   大专及以上  5-10年    10-15k·12薪  2020年04月26日   \n",
       "6   本科及以上   3-5年            面议  2020年04月26日   \n",
       "7    统招本科   1-3年     8-20k·12薪  2020年04月26日   \n",
       "8   大专及以上   3-5年     8-12k·12薪  2020年04月26日   \n",
       "9   大专及以上   3-5年     8-15k·12薪  2020年04月26日   \n",
       "10  大专及以上   3-5年     7-15k·12薪  2020年04月26日   \n",
       "11  大专及以上  5-10年     8-10k·12薪  2020年04月26日   \n",
       "12   统招本科   3-5年     8-10k·12薪  2020年04月26日   \n",
       "13   学历不限   1-3年            面议  2020年04月26日   \n",
       "14  大专及以上  5-10年    12-16k·12薪  2020年04月26日   \n",
       "15  大专及以上   1-3年     6-15k·12薪  2020年04月26日   \n",
       "16  本科及以上   3-5年    10-20k·13薪  2020年04月26日   \n",
       "17  本科及以上   1-3年      6-8k·12薪  2020年04月26日   \n",
       "18   学历不限   1-3年     5-12k·12薪  2020年04月26日   \n",
       "19  本科及以上   1-3年     6-10k·12薪  2020年04月26日   \n",
       "20  本科及以上  5-10年    10-18k·15薪  2020年04月26日   \n",
       "21  大专及以上   1-3年    10-15k·12薪  2020年04月26日   \n",
       "22   统招本科  5-10年            面议  2020年04月26日   \n",
       "23  大专及以上   1-3年    10-15k·12薪  2020年04月26日   \n",
       "24   统招本科  5-10年            面议  2020年04月26日   \n",
       "25  大专及以上   3-5年            面议  2020年04月26日   \n",
       "26  大专及以上   1-3年      6-8k·12薪  2020年04月26日   \n",
       "27  大专及以上  5-10年            面议  2020年04月26日   \n",
       "28  大专及以上   3-5年     7-12k·12薪  2020年04月26日   \n",
       "29  大专及以上   经验不限            面议  2020年04月26日   \n",
       "..    ...    ...           ...          ...   \n",
       "10  本科及以上  10年以上            面议  2020年04月26日   \n",
       "11  本科及以上  10年以上            面议  2020年04月26日   \n",
       "12  本科及以上  10年以上            面议  2020年04月26日   \n",
       "13  本科及以上   经验不限   70-100k·12薪  2020年04月26日   \n",
       "14   统招本科  10年以上    50-80k·13薪  2020年04月26日   \n",
       "15  本科及以上  10年以上   95-150k·12薪  2020年04月26日   \n",
       "16   统招本科  10年以上            面议  2020年04月26日   \n",
       "17     博士   经验不限            面议  2020年04月26日   \n",
       "18  硕士及以上  10年以上            面议  2020年04月26日   \n",
       "19  本科及以上   1-3年   70-100k·12薪  2020年04月26日   \n",
       "20  硕士及以上  10年以上   70-100k·12薪  2020年04月26日   \n",
       "21  大专及以上  10年以上  100-130k·12薪  2020年04月26日   \n",
       "22  本科及以上  5-10年    30-60k·18薪  2020年04月26日   \n",
       "23  硕士及以上   3-5年    30-60k·18薪  2020年04月26日   \n",
       "24  本科及以上   经验不限   50-100k·12薪  2020年04月26日   \n",
       "25  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "26  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "27  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "28  硕士及以上  5-10年            面议  2020年04月26日   \n",
       "29  本科及以上  5-10年    50-70k·16薪  2020年04月26日   \n",
       "30  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "31  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "32  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "33  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "34  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "35  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "36  大专及以上   1-3年    50-65k·16薪  2020年04月26日   \n",
       "37  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "38  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "39  大专及以上   1-3年    35-65k·16薪  2020年04月26日   \n",
       "\n",
       "                                                   职称       行业  \\\n",
       "0                                                市场经理   深圳-宝安区   \n",
       "1                                              薪酬绩效主管       上海   \n",
       "2                                          数据库工程师 DBA    上海-曲阳   \n",
       "3                                                课程顾问       北京   \n",
       "4                                       网络安全工程师（网攻方向）            \n",
       "5                                                审计总监       德州   \n",
       "6   海外售后技术支持经理（法语）/Overseas After Sales Technical ...       上海   \n",
       "7                                                咨询顾问   上海-青浦区   \n",
       "8                                            质量PQE工程师   珠海-香洲区   \n",
       "9                                             质量PQE主管   珠海-香洲区   \n",
       "10                                           质量SQE工程师   珠海-香洲区   \n",
       "11                                           空运副经理/经理   西安-高新区   \n",
       "12                                               综合主管       北京   \n",
       "13                                      技术员，DMT&MB实验室    上海-张江   \n",
       "14                                            模具项目工程师            \n",
       "15                                    模具设计工程师（密封-新能源）   广州-黄埔区   \n",
       "16                                               客服主管   深圳-南山区   \n",
       "17                                               财务收银   杭州-下城区   \n",
       "18                                               光电顾问   南京-江宁区   \n",
       "19                                               总账会计   深圳-宝安区   \n",
       "20                                           成本副经理/主管   广州-花都区   \n",
       "21                                               店铺店长   上海-杨浦区   \n",
       "22                                             薪酬绩效专家       杭州   \n",
       "23                                         新媒体运营/文案策划   上海-徐汇区   \n",
       "24                                          销售人力资源部总监       杭州   \n",
       "25                                               生产主管  上海-浦东新区   \n",
       "26                                               案场经理       荆门   \n",
       "27                                             港口物流经理       扬州   \n",
       "28                                          java开发工程师       郑州   \n",
       "29                                               游戏特效       北京   \n",
       "..                                                ...      ...   \n",
       "10                                            储备学校总校长       长沙   \n",
       "11                                            储备学校总校长       苏州   \n",
       "12                                            储备学校总校长       上海   \n",
       "13                                               算法总监       北京   \n",
       "14                                          技术专家/技术总监    上海-张江   \n",
       "15                                               技术总监       成都   \n",
       "16                                             智能谷负责人   上海-青浦区   \n",
       "17                                           Resin GM       上海   \n",
       "18                          RA Senior Director - Asia       上海   \n",
       "19                                               交付经理   深圳-龙岗区   \n",
       "20                                       通信系统工程师（专家级）            \n",
       "21                                         首席运营官（COO）    珠海-迎宾   \n",
       "22                                       腾讯云安全后台开发工程师   深圳-南山区   \n",
       "23                                          售后技术支持工程师   深圳-南山区   \n",
       "24                                           大湾区事业部总监       深圳   \n",
       "25                                       阿里淘小铺掌柜（合伙人）   武汉-江汉区   \n",
       "26                                         淘小铺掌柜（合伙人）   长沙-芙蓉区   \n",
       "27                                       阿里淘小铺掌柜（合伙人）   广州-越秀区   \n",
       "28                                             语音算法总监       上海   \n",
       "29                                              项目总经理   深圳-罗湖区   \n",
       "30                                         淘小铺掌柜（合伙人）   南京-玄武区   \n",
       "31                                         淘小铺掌柜（合伙人）   上海-黄浦区   \n",
       "32                                         淘小铺掌柜（合伙人）            \n",
       "33                                         淘小铺掌柜（合伙人）   武汉-武昌区   \n",
       "34                                         淘小铺掌柜（合伙人）    苏州-昆山   \n",
       "35                                         淘小铺掌柜（合伙人）   厦门-思明区   \n",
       "36                                         淘小铺掌柜（合伙人）   绍兴-越城区   \n",
       "37                                         淘小铺掌柜（合伙人）   杭州-拱墅区   \n",
       "38                                         淘小铺掌柜（合伙人）   深圳-福田区   \n",
       "39                                         淘小铺掌柜（合伙人）   广州-天河北   \n",
       "\n",
       "                 公司名称                                           链结  \\\n",
       "0         深圳市耀美环保有限公司  https://www.liepin.com/job/1927771863.shtml   \n",
       "1        中翔金属(上海)有限公司  https://www.liepin.com/job/1927771369.shtml   \n",
       "2         MDC Telecom  https://www.liepin.com/job/1927770857.shtml   \n",
       "3          北京新得科技有限公司  https://www.liepin.com/job/1927770073.shtml   \n",
       "4        北京华油信通科技有限公司  https://www.liepin.com/job/1927769745.shtml   \n",
       "5                泰山体育  https://www.liepin.com/job/1927769743.shtml   \n",
       "6                爱驰汽车  https://www.liepin.com/job/1927769147.shtml   \n",
       "7         上海爱湃斯科技有限公司  https://www.liepin.com/job/1927767341.shtml   \n",
       "8                 英搏尔  https://www.liepin.com/job/1927766961.shtml   \n",
       "9                 英搏尔  https://www.liepin.com/job/1927766881.shtml   \n",
       "10                英搏尔  https://www.liepin.com/job/1927766799.shtml   \n",
       "11  海得邦国际物流控股(集团)有限公司  https://www.liepin.com/job/1927766623.shtml   \n",
       "12           亿达控股有限公司  https://www.liepin.com/job/1927766331.shtml   \n",
       "13               罗氏制药  https://www.liepin.com/job/1927766269.shtml   \n",
       "14      滁州市博康模具塑料有限公司  https://www.liepin.com/job/1927764739.shtml   \n",
       "15               国机智能  https://www.liepin.com/job/1927749185.shtml   \n",
       "16               泽金金服  https://www.liepin.com/job/1927746007.shtml   \n",
       "17              阳光城集团  https://www.liepin.com/job/1927744955.shtml   \n",
       "18     江苏灵美东方医院管理有限公司  https://www.liepin.com/job/1927739435.shtml   \n",
       "19                HKC  https://www.liepin.com/job/1927733447.shtml   \n",
       "20               鸿利光电  https://www.liepin.com/job/1927727601.shtml   \n",
       "21                百合网  https://www.liepin.com/job/1927726909.shtml   \n",
       "22               农夫山泉  https://www.liepin.com/job/1927726751.shtml   \n",
       "23         上海宜来卫浴有限公司  https://www.liepin.com/job/1927711449.shtml   \n",
       "24               农夫山泉  https://www.liepin.com/job/1927710481.shtml   \n",
       "25     上海微创心通医疗科技有限公司  https://www.liepin.com/job/1927706945.shtml   \n",
       "26       浙江祥生物业服务有限公司  https://www.liepin.com/job/1927698187.shtml   \n",
       "27         君明实业集团有限公司  https://www.liepin.com/job/1927697843.shtml   \n",
       "28     郑州格蒂电力智能科技有限公司  https://www.liepin.com/job/1927692971.shtml   \n",
       "29       北京涂鸦多得科技有限公司  https://www.liepin.com/job/1927691417.shtml   \n",
       "..                ...                                          ...   \n",
       "10       上海中锐教育发展有限公司  https://www.liepin.com/job/1927771441.shtml   \n",
       "11       上海中锐教育发展有限公司  https://www.liepin.com/job/1927771439.shtml   \n",
       "12       上海中锐教育发展有限公司  https://www.liepin.com/job/1927771437.shtml   \n",
       "13               福佑卡车  https://www.liepin.com/job/1927770267.shtml   \n",
       "14       上海擎创信息技术有限公司  https://www.liepin.com/job/1927768823.shtml   \n",
       "15     成都聚创伟业电子商务有限公司  https://www.liepin.com/job/1927768425.shtml   \n",
       "16       上海爱仕达机器人有限公司  https://www.liepin.com/job/1927767777.shtml   \n",
       "17     米高蒲志国际(香港)有限公司  https://www.liepin.com/job/1927767483.shtml   \n",
       "18     米高蒲志国际(香港)有限公司  https://www.liepin.com/job/1927766255.shtml   \n",
       "19               深南电路  https://www.liepin.com/job/1927764193.shtml   \n",
       "20     北京九天微星科技发展有限公司  https://www.liepin.com/job/1927763193.shtml   \n",
       "21       爱婴岛新零售管理有限公司  https://www.liepin.com/job/1927761455.shtml   \n",
       "22                 腾讯  https://www.liepin.com/job/1927760483.shtml   \n",
       "23                 腾讯  https://www.liepin.com/job/1927760395.shtml   \n",
       "24     中舍控股(深圳)有限责任公司  https://www.liepin.com/job/1927756871.shtml   \n",
       "25        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927755049.shtml   \n",
       "26        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927755013.shtml   \n",
       "27        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927754935.shtml   \n",
       "28               竹间智能  https://www.liepin.com/job/1927740819.shtml   \n",
       "29      深圳市东旭鸿基地产有限公司  https://www.liepin.com/job/1927734901.shtml   \n",
       "30        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731723.shtml   \n",
       "31        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731713.shtml   \n",
       "32        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731701.shtml   \n",
       "33        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731679.shtml   \n",
       "34        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731577.shtml   \n",
       "35        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731555.shtml   \n",
       "36        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731551.shtml   \n",
       "37        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731485.shtml   \n",
       "38        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731457.shtml   \n",
       "39        湖北古荆州酒业有限公司  https://www.liepin.com/job/1927731439.shtml   \n",
       "\n",
       "                                       公司URL    薪资水平  \n",
       "0    https://www.liepin.com/company/9234847/  10-15万  \n",
       "1    https://www.liepin.com/company/9454064/  10-15万  \n",
       "2    https://www.liepin.com/company/8104849/  10-15万  \n",
       "3    https://www.liepin.com/company/9807335/  10-15万  \n",
       "4    https://www.liepin.com/company/8330229/  10-15万  \n",
       "5    https://www.liepin.com/company/7958679/  10-15万  \n",
       "6    https://www.liepin.com/company/9146383/  10-15万  \n",
       "7   https://www.liepin.com/company/10006015/  10-15万  \n",
       "8    https://www.liepin.com/company/9557666/  10-15万  \n",
       "9    https://www.liepin.com/company/9557666/  10-15万  \n",
       "10   https://www.liepin.com/company/9557666/  10-15万  \n",
       "11  https://www.liepin.com/company/10079421/  10-15万  \n",
       "12   https://www.liepin.com/company/2048766/  10-15万  \n",
       "13    https://www.liepin.com/company/916012/  10-15万  \n",
       "14   https://www.liepin.com/company/8593126/  10-15万  \n",
       "15   https://www.liepin.com/company/8942684/  10-15万  \n",
       "16   https://www.liepin.com/company/8787574/  10-15万  \n",
       "17    https://www.liepin.com/company/876734/  10-15万  \n",
       "18  https://www.liepin.com/company/10030447/  10-15万  \n",
       "19   https://www.liepin.com/company/8795947/  10-15万  \n",
       "20   https://www.liepin.com/company/2246346/  10-15万  \n",
       "21  https://www.liepin.com/company/10077527/  10-15万  \n",
       "22   https://www.liepin.com/company/2868477/  10-15万  \n",
       "23  https://www.liepin.com/company/10082469/  10-15万  \n",
       "24   https://www.liepin.com/company/2868477/  10-15万  \n",
       "25   https://www.liepin.com/company/9494398/  10-15万  \n",
       "26   https://www.liepin.com/company/9115685/  10-15万  \n",
       "27  https://www.liepin.com/company/12180625/  10-15万  \n",
       "28  https://www.liepin.com/company/10095389/  10-15万  \n",
       "29   https://www.liepin.com/company/7877511/  10-15万  \n",
       "..                                       ...     ...  \n",
       "10  https://www.liepin.com/company/10117087/  100万以上  \n",
       "11  https://www.liepin.com/company/10117087/  100万以上  \n",
       "12  https://www.liepin.com/company/10117087/  100万以上  \n",
       "13  https://www.liepin.com/company/10058353/  100万以上  \n",
       "14   https://www.liepin.com/company/9173769/  100万以上  \n",
       "15   https://www.liepin.com/company/9699967/  100万以上  \n",
       "16  https://www.liepin.com/company/10172529/  100万以上  \n",
       "17   https://www.liepin.com/company/1790705/  100万以上  \n",
       "18   https://www.liepin.com/company/1790705/  100万以上  \n",
       "19   https://www.liepin.com/company/8136258/  100万以上  \n",
       "20   https://www.liepin.com/company/9247111/  100万以上  \n",
       "21   https://www.liepin.com/company/9090500/  100万以上  \n",
       "22   https://www.liepin.com/company/7983148/  100万以上  \n",
       "23   https://www.liepin.com/company/7983148/  100万以上  \n",
       "24  https://www.liepin.com/company/12222055/  100万以上  \n",
       "25  https://www.liepin.com/company/10020805/  100万以上  \n",
       "26  https://www.liepin.com/company/10020805/  100万以上  \n",
       "27  https://www.liepin.com/company/10020805/  100万以上  \n",
       "28   https://www.liepin.com/company/8608119/  100万以上  \n",
       "29   https://www.liepin.com/company/9645744/  100万以上  \n",
       "30  https://www.liepin.com/company/10020805/  100万以上  \n",
       "31  https://www.liepin.com/company/10020805/  100万以上  \n",
       "32  https://www.liepin.com/company/10020805/  100万以上  \n",
       "33  https://www.liepin.com/company/10020805/  100万以上  \n",
       "34  https://www.liepin.com/company/10020805/  100万以上  \n",
       "35  https://www.liepin.com/company/10020805/  100万以上  \n",
       "36  https://www.liepin.com/company/10020805/  100万以上  \n",
       "37  https://www.liepin.com/company/10020805/  100万以上  \n",
       "38  https://www.liepin.com/company/10020805/  100万以上  \n",
       "39  https://www.liepin.com/company/10020805/  100万以上  \n",
       "\n",
       "[240 rows x 10 columns]"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Issue one request per salary bracket and stack the resulting frames into df_all.\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "\n",
    "list_df = []\n",
    "for 薪资标签, 薪资参数 in 参数_salary_用户体验.items():\n",
    "    # NOTE(review): keep `payload` bound at module level; requests_liepin may read it\n",
    "    # as a global instead of using `params`. Verify before inlining this assignment.\n",
    "    payload = 薪资参数\n",
    "    # Tag every row with the bracket label it was scraped under.\n",
    "    df = requests_liepin(url, params=payload).assign(薪资水平=薪资标签)\n",
    "    list_df.append(df)\n",
    "\n",
    "df_all = pd.concat(list_df)\n",
    "df_all"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {},
   "outputs": [],
   "source": [
    "# C-4  Export: write the combined salary-bracket frame to an Excel workbook.\n",
    "df_all.to_excel(\n",
    "    excel_writer=\"薪资类型的数据爬取.xlsx\",\n",
    "    sheet_name=\"搜查结果\",\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 翻页模版构建"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[<Element 'a' href='/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=1'>, <Element 'a' href='/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=2'>, <Element 'a' href='/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=3'>, <Element 'a' href='/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=4'>, <Element 'a' href='/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=1'>, <Element 'a' class=('last',) 
href='/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=9' title='末页'>]\n"
     ]
    }
   ],
   "source": [
    "# Pagination: fetch the search page and locate the pager links (a/@href) with xpath.\n",
    "url = \"https://www.liepin.com/zhaopin/?keyword=人力资源\"\n",
    "session = HTMLSession()\n",
    "r = session.get(url)\n",
    "# A-1  Select the pager anchors. A bare '//div[@class=\"pagerbar\"]/a' also matches the\n",
    "# disabled/current anchors whose href is javascript, so only hrefs that start with\n",
    "# /zhaopin are kept. (The unfiltered xpath used to be assigned and then overwritten.)\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "print (r.html.xpath(xpath_翻页a))  # Element objects"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=1', '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=2', '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=3', '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=4', '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=1', 
'/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=9']\n"
     ]
    }
   ],
   "source": [
    "# Reduce the pager anchors selected above to a plain list of their href strings.\n",
    "href_列表 = [\n",
    "    翻页a.xpath('//@href')[0]\n",
    "    for 翻页a in r.html.xpath(xpath_翻页a)\n",
    "]\n",
    "print (href_列表)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'2': '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=1', '3': '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=2', '4': '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=3', '5': '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=4', '下一页': '/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=1', '': 
'/zhaopin/?init=-1&headckid=c1e2a51184667c72&fromSearchBtn=2&keyword=%E4%BA%BA%E5%8A%9B%E8%B5%84%E6%BA%90&ckid=c1e2a51184667c72°radeFlag=0&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=1d776a12200aba5d6b043c5b507e08b7&d_curPage=0&d_pageSize=40&d_headId=1d776a12200aba5d6b043c5b507e08b7&curPage=9'}\n"
     ]
    }
   ],
   "source": [
    "# Map each pager anchor's text to its href; anchors sharing a text overwrite each other.\n",
    "href_字典 = dict(\n",
    "    (翻页a.text, 翻页a.xpath('//@href')[0])\n",
    "    for 翻页a in r.html.xpath(xpath_翻页a)\n",
    ")\n",
    "print (href_字典)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [],
   "source": [
    "session = HTMLSession()\n",
    "\n",
    "def requests_liepin( url, params):\n",
    "    \"\"\"Fetch one liepin search-result page and return its job cards as a DataFrame.\n",
    "\n",
    "    Args:\n",
    "        url: Address passed to ``session.get``.\n",
    "        params: Query parameters passed to ``session.get`` as ``params``.\n",
    "\n",
    "    Returns:\n",
    "        pandas.DataFrame with one row per ``li`` under ``ul.sojob-list`` and one\n",
    "        column per key of ``dict_xpaths``. A card that lacks a node gets an empty\n",
    "        string in that column.\n",
    "    \"\"\"\n",
    "    # Bug fix: this call used to send the module-level `payload` and ignore `params`.\n",
    "    r = session.get(url, params=params)\n",
    "\n",
    "    # Select the job cards first; every xpath below is evaluated inside one card.\n",
    "    主要元素 = r.html.xpath('//ul[@class=\"sojob-list\"]/li')\n",
    "\n",
    "    # Column name -> xpath, grouped by the way the value is extracted.\n",
    "    dict_xpaths = {\n",
    "        'text': {\n",
    "            'edu':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]',\n",
    "            '经验':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]/following-sibling::span',\n",
    "            '薪水':    '//div[contains(@class,\"job-info\")]/p/span[@class=\"text-warning\"]',\n",
    "            '时间':    '//div[contains(@class,\"job-info\")]/p/time/@title',\n",
    "            '职称':    '//div[contains(@class,\"job-info\")]/h3/a',\n",
    "            '公司地点': '//div[contains(@class,\"job-info\")]/p/a',\n",
    "            '公司名称': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a',\n",
    "        },\n",
    "        'text_content': {\n",
    "        },\n",
    "        'href': {\n",
    "            '链结':    '//div[contains(@class,\"job-info\")]/h3/a',\n",
    "            '公司URL': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a',\n",
    "        }\n",
    "    }\n",
    "\n",
    "    def get_e_text_content(_xpath_):\n",
    "        # text_content() of the first match per card; empty string when nothing matches\n",
    "        # (indexing [0] on an empty result used to raise IndexError).\n",
    "        暂存结果 = []\n",
    "        for e in 主要元素:\n",
    "            命中 = e.xpath(_xpath_, first=True)\n",
    "            暂存结果.append(\"\" if 命中 is None else 命中.lxml.text_content())\n",
    "        return 暂存结果\n",
    "\n",
    "    def get_e_text(_xpath_):\n",
    "        # Join the stripped text of every match per card. A match is either a plain\n",
    "        # string (the '时间' xpath selects the @title attribute) or an element with .text.\n",
    "        return [\n",
    "            \"\".join(x.strip() if isinstance(x, str) else x.text.strip()\n",
    "                    for x in e.xpath(_xpath_))\n",
    "            for e in 主要元素\n",
    "        ]\n",
    "\n",
    "    def get_e_href(_xpath_):\n",
    "        # First absolute link of the first match per card; empty string when the card\n",
    "        # has no such node (used to raise AttributeError on None) or the node has no link.\n",
    "        暂存结果 = []\n",
    "        for e in 主要元素:\n",
    "            命中 = e.xpath(_xpath_, first=True)\n",
    "            链接 = list(命中.absolute_links) if 命中 is not None else []\n",
    "            暂存结果.append(链接[0] if 链接 else \"\")\n",
    "        return 暂存结果\n",
    "\n",
    "    # Assemble the columns in the same order as before: text_content, text, href.\n",
    "    数据字典 = {k: get_e_text_content(v) for k, v in dict_xpaths['text_content'].items()}\n",
    "    数据字典.update({k: get_e_text(v) for k, v in dict_xpaths['text'].items()})\n",
    "    数据字典.update({k: get_e_href(v) for k, v in dict_xpaths['href'].items()})\n",
    "\n",
    "    return pd.DataFrame(数据字典)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [],
   "source": [
    "import time\n",
    "from random import random\n",
    "\n",
    "#%%time\n",
    "# Pause for a random interval between 3 and 7 seconds.\n",
    "time.sleep(4*random() + 3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#%%time\n",
    "# B-3  Multiple pages x multiple keywords\n",
    "import time\n",
    "from random import random\n",
    "\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "\n",
    "keywords = ['人力资源','影视文化','文体娱乐','服装纺织']\n",
    "list_df = list()\n",
    "\n",
    "for key in keywords:\n",
    "    ## Probe the first page of THIS keyword to learn how many pages it has.\n",
    "    payload = 参数模板生成(keyword=[key], curPage=['0'])\n",
    "    # Bug fix: the pager links used to be read from a stale global `r` (the response\n",
    "    # fetched in an earlier cell), so every keyword got the same page count.\n",
    "    # requests_liepin does not hand back its response, so the page is fetched here.\n",
    "    r = session.get(url, params=payload)\n",
    "    href_列表 = [x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)]\n",
    "    # Read curPage from each pager href; the page count is the largest value + 1.\n",
    "    页码 = [int(qs['curPage'][0])\n",
    "            for qs in (parse_qs(urlparse(x).query) for x in href_列表)\n",
    "            if 'curPage' in qs]\n",
    "    长度 = max(页码) + 1 if 页码 else 1  # no pager links -> treat as a single page\n",
    "    参数_keyword_X_curPage = {\n",
    "        i: 参数模板生成(curPage=[i], keyword=[key])\n",
    "        for i in range(0, 长度)\n",
    "    }\n",
    "    print (key,长度)\n",
    "\n",
    "    for k,v in 参数_keyword_X_curPage.items():\n",
    "        # NOTE(review): keep `payload` bound at module level; requests_liepin may read\n",
    "        # it as a global instead of using `params`. Verify before inlining.\n",
    "        payload = v\n",
    "        df = requests_liepin( url, params = payload)\n",
    "        time.sleep(3+4*random())  # slow down: 3-7 s, about 5 s on average\n",
    "        df = df.assign (keyword = key)  # tag rows with the keyword\n",
    "        df = df.assign (curPage = k)  # tag rows with the page number\n",
    "        list_df.append(df)\n",
    "\n",
    "df_all = pd.concat(list_df).reset_index()\n",
    "df_all.index.name = '序'\n",
    "\n",
    "df_all.to_excel(\"人力资源_影视文化_文体娱乐_服装纺织_翻页数据.xlsx\",\n",
    "                sheet_name=\"_\".join(keywords))\n",
    "# Author's rough estimate, time: 2*5 s*10 = 100\n",
    "# Author's rough estimate, rows: 2*40*10 = 800"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
